[
{
"page_no": 0,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.9,
"r_x1": 498.9,
"r_y1": 119.9,
"r_x2": 498.9,
"r_y2": 107.0,
"r_x3": 96.3,
"r_y3": 107.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.5,
"r_y0": 157.4,
"r_x1": 452.8,
"r_y1": 157.4,
"r_x2": 452.8,
"r_y2": 146.7,
"r_x3": 142.5,
"r_y3": 146.7,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.9,
"r_y0": 171.3,
"r_x1": 332.3,
"r_y1": 171.3,
"r_x2": 332.3,
"r_y2": 160.6,
"r_x3": 262.9,
"r_y3": 160.6,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 226.2,
"r_x1": 190.5,
"r_y1": 226.2,
"r_x2": 190.5,
"r_y2": 215.5,
"r_x3": 146.0,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 250.0,
"r_x1": 286.4,
"r_y1": 250.0,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 62.1,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 261.9,
"r_x1": 286.4,
"r_y1": 261.9,
"r_x2": 286.4,
"r_y2": 253.4,
"r_x3": 50.1,
"r_y3": 253.4,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 273.9,
"r_x1": 286.4,
"r_y1": 273.9,
"r_x2": 286.4,
"r_y2": 265.3,
"r_x3": 50.1,
"r_y3": 265.3,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 285.8,
"r_x1": 286.4,
"r_y1": 285.8,
"r_x2": 286.4,
"r_y2": 277.3,
"r_x3": 50.1,
"r_y3": 277.3,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 297.8,
"r_x1": 286.4,
"r_y1": 297.8,
"r_x2": 286.4,
"r_y2": 289.2,
"r_x3": 50.1,
"r_y3": 289.2,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 309.8,
"r_x1": 286.4,
"r_y1": 309.8,
"r_x2": 286.4,
"r_y2": 301.2,
"r_x3": 50.1,
"r_y3": 301.2,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 321.7,
"r_x1": 286.4,
"r_y1": 321.7,
"r_x2": 286.4,
"r_y2": 313.1,
"r_x3": 50.1,
"r_y3": 313.1,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 333.7,
"r_x1": 286.4,
"r_y1": 333.7,
"r_x2": 286.4,
"r_y2": 325.1,
"r_x3": 50.1,
"r_y3": 325.1,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 345.6,
"r_x1": 286.4,
"r_y1": 345.6,
"r_x2": 286.4,
"r_y2": 337.0,
"r_x3": 50.1,
"r_y3": 337.0,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 357.6,
"r_x1": 286.4,
"r_y1": 357.6,
"r_x2": 286.4,
"r_y2": 349.0,
"r_x3": 50.1,
"r_y3": 349.0,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 369.5,
"r_x1": 286.4,
"r_y1": 369.5,
"r_x2": 286.4,
"r_y2": 360.9,
"r_x3": 50.1,
"r_y3": 360.9,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 381.5,
"r_x1": 286.4,
"r_y1": 381.5,
"r_x2": 286.4,
"r_y2": 372.9,
"r_x3": 50.1,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 393.4,
"r_x1": 286.4,
"r_y1": 393.4,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 405.4,
"r_x1": 286.4,
"r_y1": 405.4,
"r_x2": 286.4,
"r_y2": 396.8,
"r_x3": 50.1,
"r_y3": 396.8,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 417.4,
"r_x1": 286.4,
"r_y1": 417.4,
"r_x2": 286.4,
"r_y2": 408.8,
"r_x3": 50.1,
"r_y3": 408.8,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 429.3,
"r_x1": 286.4,
"r_y1": 429.3,
"r_x2": 286.4,
"r_y2": 420.7,
"r_x3": 50.1,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 441.3,
"r_x1": 207.2,
"r_y1": 441.3,
"r_x2": 207.2,
"r_y2": 432.7,
"r_x3": 50.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.3,
"r_x1": 286.4,
"r_y1": 441.3,
"r_x2": 286.4,
"r_y2": 432.7,
"r_x3": 214.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 453.2,
"r_x1": 286.4,
"r_y1": 453.2,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 50.1,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 465.2,
"r_x1": 286.4,
"r_y1": 465.2,
"r_x2": 286.4,
"r_y2": 456.6,
"r_x3": 50.1,
"r_y3": 456.6,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 477.1,
"r_x1": 286.4,
"r_y1": 477.1,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 50.1,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 489.1,
"r_x1": 286.4,
"r_y1": 489.1,
"r_x2": 286.4,
"r_y2": 480.5,
"r_x3": 50.1,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.0,
"r_x1": 286.4,
"r_y1": 501.0,
"r_x2": 286.4,
"r_y2": 492.5,
"r_x3": 50.1,
"r_y3": 492.5,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 513.0,
"r_x1": 276.7,
"r_y1": 513.0,
"r_x2": 276.7,
"r_y2": 504.4,
"r_x3": 50.1,
"r_y3": 504.4,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.7,
"r_x1": 58.1,
"r_y1": 550.7,
"r_x2": 58.1,
"r_y2": 539.9,
"r_x3": 50.1,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.7,
"r_x1": 126.9,
"r_y1": 550.7,
"r_x2": 126.9,
"r_y2": 539.9,
"r_x3": 68.8,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 62.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 76.4,
"r_y1": 713.2,
"r_x2": 76.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 226.8,
"r_x1": 324.0,
"r_y1": 226.8,
"r_x2": 324.0,
"r_y2": 218.0,
"r_x3": 315.6,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.2,
"r_y0": 226.8,
"r_x1": 408.4,
"r_y1": 226.8,
"r_x2": 408.4,
"r_y2": 218.0,
"r_x3": 328.2,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 322.4,
"r_x1": 325.1,
"r_y1": 322.4,
"r_x2": 325.1,
"r_y2": 313.7,
"r_x3": 315.6,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.4,
"r_x1": 486.4,
"r_y1": 322.4,
"r_x2": 486.4,
"r_y2": 313.7,
"r_x3": 329.8,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.5,
"r_y0": 333.2,
"r_x1": 472.5,
"r_y1": 333.2,
"r_x2": 472.5,
"r_y2": 324.5,
"r_x3": 326.5,
"r_y3": 324.5,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 428.9,
"r_x1": 324.8,
"r_y1": 428.9,
"r_x2": 324.8,
"r_y2": 420.2,
"r_x3": 315.6,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.4,
"r_y0": 428.9,
"r_x1": 491.2,
"r_y1": 428.9,
"r_x2": 491.2,
"r_y2": 420.2,
"r_x3": 329.4,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 523.4,
"r_x1": 345.7,
"r_y1": 523.4,
"r_x2": 345.7,
"r_y2": 514.5,
"r_x3": 308.9,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.2,
"r_y0": 523.4,
"r_x1": 545.1,
"r_y1": 523.4,
"r_x2": 545.1,
"r_y2": 514.5,
"r_x3": 353.2,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 535.4,
"r_x1": 545.1,
"r_y1": 535.4,
"r_x2": 545.1,
"r_y2": 526.5,
"r_x3": 308.9,
"r_y3": 526.5,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 547.3,
"r_x1": 545.1,
"r_y1": 547.3,
"r_x2": 545.1,
"r_y2": 538.4,
"r_x3": 308.9,
"r_y3": 538.4,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 559.3,
"r_x1": 505.7,
"r_y1": 559.3,
"r_x2": 505.7,
"r_y2": 550.4,
"r_x3": 308.9,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 320.8,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.3,
"r_x1": 545.1,
"r_y1": 605.3,
"r_x2": 545.1,
"r_y2": 596.4,
"r_x3": 308.9,
"r_y3": 596.4,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.2,
"r_x1": 545.1,
"r_y1": 629.2,
"r_x2": 545.1,
"r_y2": 620.3,
"r_x3": 308.9,
"r_y3": 620.3,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 353.7,
"r_y1": 641.1,
"r_x2": 353.7,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.1,
"r_y0": 641.1,
"r_x1": 374.7,
"r_y1": 641.1,
"r_x2": 374.7,
"r_y2": 632.2,
"r_x3": 362.1,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.4,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 377.4,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.1,
"r_x1": 545.1,
"r_y1": 653.1,
"r_x2": 545.1,
"r_y2": 644.2,
"r_x3": 308.9,
"r_y3": 644.2,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 375.6,
"r_y1": 665.0,
"r_x2": 375.6,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 320.8,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.3,
"r_y0": 560.0,
"r_x1": 36.3,
"r_y1": 560.0,
"r_x2": 36.3,
"r_y2": 207.8,
"r_x3": 18.3,
"r_y3": 207.8,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.0,
"r": 498.9,
"b": 119.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.9,
"r_x1": 498.9,
"r_y1": 119.9,
"r_x2": 498.9,
"r_y2": 107.0,
"r_x3": 96.3,
"r_y3": 107.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.5,
"t": 146.7,
"r": 452.8,
"b": 171.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.5,
"r_y0": 157.4,
"r_x1": 452.8,
"r_y1": 157.4,
"r_x2": 452.8,
"r_y2": 146.7,
"r_x3": 142.5,
"r_y3": 146.7,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.9,
"r_y0": 171.3,
"r_x1": 332.3,
"r_y1": 171.3,
"r_x2": 332.3,
"r_y2": 160.6,
"r_x3": 262.9,
"r_y3": 160.6,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.49,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 5,
"label": "section_header",
"bbox": {
"l": 146.0,
"t": 215.5,
"r": 190.5,
"b": 226.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 226.2,
"r_x1": 190.5,
"r_y1": 226.2,
"r_x2": 190.5,
"r_y2": 215.5,
"r_x3": 146.0,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 241.4,
"r": 286.4,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 250.0,
"r_x1": 286.4,
"r_y1": 250.0,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 62.1,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 261.9,
"r_x1": 286.4,
"r_y1": 261.9,
"r_x2": 286.4,
"r_y2": 253.4,
"r_x3": 50.1,
"r_y3": 253.4,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 273.9,
"r_x1": 286.4,
"r_y1": 273.9,
"r_x2": 286.4,
"r_y2": 265.3,
"r_x3": 50.1,
"r_y3": 265.3,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 285.8,
"r_x1": 286.4,
"r_y1": 285.8,
"r_x2": 286.4,
"r_y2": 277.3,
"r_x3": 50.1,
"r_y3": 277.3,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 297.8,
"r_x1": 286.4,
"r_y1": 297.8,
"r_x2": 286.4,
"r_y2": 289.2,
"r_x3": 50.1,
"r_y3": 289.2,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 309.8,
"r_x1": 286.4,
"r_y1": 309.8,
"r_x2": 286.4,
"r_y2": 301.2,
"r_x3": 50.1,
"r_y3": 301.2,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 321.7,
"r_x1": 286.4,
"r_y1": 321.7,
"r_x2": 286.4,
"r_y2": 313.1,
"r_x3": 50.1,
"r_y3": 313.1,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 333.7,
"r_x1": 286.4,
"r_y1": 333.7,
"r_x2": 286.4,
"r_y2": 325.1,
"r_x3": 50.1,
"r_y3": 325.1,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 345.6,
"r_x1": 286.4,
"r_y1": 345.6,
"r_x2": 286.4,
"r_y2": 337.0,
"r_x3": 50.1,
"r_y3": 337.0,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 357.6,
"r_x1": 286.4,
"r_y1": 357.6,
"r_x2": 286.4,
"r_y2": 349.0,
"r_x3": 50.1,
"r_y3": 349.0,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 369.5,
"r_x1": 286.4,
"r_y1": 369.5,
"r_x2": 286.4,
"r_y2": 360.9,
"r_x3": 50.1,
"r_y3": 360.9,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 381.5,
"r_x1": 286.4,
"r_y1": 381.5,
"r_x2": 286.4,
"r_y2": 372.9,
"r_x3": 50.1,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 393.4,
"r_x1": 286.4,
"r_y1": 393.4,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 405.4,
"r_x1": 286.4,
"r_y1": 405.4,
"r_x2": 286.4,
"r_y2": 396.8,
"r_x3": 50.1,
"r_y3": 396.8,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 417.4,
"r_x1": 286.4,
"r_y1": 417.4,
"r_x2": 286.4,
"r_y2": 408.8,
"r_x3": 50.1,
"r_y3": 408.8,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 429.3,
"r_x1": 286.4,
"r_y1": 429.3,
"r_x2": 286.4,
"r_y2": 420.7,
"r_x3": 50.1,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 441.3,
"r_x1": 207.2,
"r_y1": 441.3,
"r_x2": 207.2,
"r_y2": 432.7,
"r_x3": 50.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.3,
"r_x1": 286.4,
"r_y1": 441.3,
"r_x2": 286.4,
"r_y2": 432.7,
"r_x3": 214.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 453.2,
"r_x1": 286.4,
"r_y1": 453.2,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 50.1,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 465.2,
"r_x1": 286.4,
"r_y1": 465.2,
"r_x2": 286.4,
"r_y2": 456.6,
"r_x3": 50.1,
"r_y3": 456.6,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 477.1,
"r_x1": 286.4,
"r_y1": 477.1,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 50.1,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 489.1,
"r_x1": 286.4,
"r_y1": 489.1,
"r_x2": 286.4,
"r_y2": 480.5,
"r_x3": 50.1,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.0,
"r_x1": 286.4,
"r_y1": 501.0,
"r_x2": 286.4,
"r_y2": 492.5,
"r_x3": 50.1,
"r_y3": 492.5,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 513.0,
"r_x1": 276.7,
"r_y1": 513.0,
"r_x2": 276.7,
"r_y2": 504.4,
"r_x3": 50.1,
"r_y3": 504.4,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 539.9,
"r": 126.9,
"b": 550.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.7,
"r_x1": 58.1,
"r_y1": 550.7,
"r_x2": 58.1,
"r_y2": 539.9,
"r_x3": 50.1,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.7,
"r_x1": 126.9,
"r_y1": 550.7,
"r_x2": 126.9,
"r_y2": 539.9,
"r_x3": 68.8,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 560.8,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 62.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 76.4,
"r_y1": 713.2,
"r_x2": 76.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.6,
"t": 218.0,
"r": 408.4,
"b": 226.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.67,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 226.8,
"r_x1": 324.0,
"r_y1": 226.8,
"r_x2": 324.0,
"r_y2": 218.0,
"r_x3": 315.6,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.2,
"r_y0": 226.8,
"r_x1": 408.4,
"r_y1": 226.8,
"r_x2": 408.4,
"r_y2": 218.0,
"r_x3": 328.2,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 313.7,
"r": 486.4,
"b": 333.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 322.4,
"r_x1": 325.1,
"r_y1": 322.4,
"r_x2": 325.1,
"r_y2": 313.7,
"r_x3": 315.6,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.4,
"r_x1": 486.4,
"r_y1": 322.4,
"r_x2": 486.4,
"r_y2": 313.7,
"r_x3": 329.8,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.5,
"r_y0": 333.2,
"r_x1": 472.5,
"r_y1": 333.2,
"r_x2": 472.5,
"r_y2": 324.5,
"r_x3": 326.5,
"r_y3": 324.5,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 420.2,
"r": 491.2,
"b": 428.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 428.9,
"r_x1": 324.8,
"r_y1": 428.9,
"r_x2": 324.8,
"r_y2": 420.2,
"r_x3": 315.6,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.4,
"r_y0": 428.9,
"r_x1": 491.2,
"r_y1": 428.9,
"r_x2": 491.2,
"r_y2": 420.2,
"r_x3": 329.4,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "picture",
"bbox": {
"l": 314.8,
"t": 338.1,
"r": 539.2,
"b": 410.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.1,
"t": 342.8,
"r": 412.5,
"b": 351.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.1,
"t": 341.6,
"r": 360.5,
"b": 350.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.7,
"t": 340.9,
"r": 505.1,
"b": 349.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.1,
"t": 351.7,
"r": 360.5,
"b": 360.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.5,
"t": 355.9,
"r": 406.9,
"b": 364.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.6,
"t": 352.8,
"r": 453.0,
"b": 361.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.7,
"t": 353.7,
"r": 496.0,
"b": 362.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.1,
"t": 353.3,
"r": 539.5,
"b": 362.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.8,
"t": 387.1,
"r": 353.2,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.3,
"t": 375.4,
"r": 393.7,
"b": 384.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.7,
"t": 375.6,
"r": 451.5,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.4,
"t": 375.5,
"r": 485.9,
"b": 384.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.6,
"t": 375.6,
"r": 531.4,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.2,
"t": 387.1,
"r": 409.0,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.3,
"t": 387.0,
"r": 451.1,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.2,
"t": 387.4,
"r": 487.0,
"b": 396.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.2,
"t": 387.0,
"r": 532.0,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.6,
"t": 399.4,
"r": 416.0,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 416.0,
"t": 399.4,
"r": 420.4,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.3,
"t": 399.0,
"r": 451.1,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.8,
"t": 399.0,
"r": 487.6,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 524.0,
"t": 398.6,
"r": 532.8,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.1,
"t": 357.8,
"r": 391.1,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.4,
"t": 380.7,
"r": 339.4,
"b": 390.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.1,
"t": 341.0,
"r": 484.1,
"b": 351.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 23,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.51,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "table",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 16,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.61,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 15,
"label": "table",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 6,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 514.5,
"r": 545.1,
"b": 559.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 523.4,
"r_x1": 345.7,
"r_y1": 523.4,
"r_x2": 345.7,
"r_y2": 514.5,
"r_x3": 308.9,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.2,
"r_y0": 523.4,
"r_x1": 545.1,
"r_y1": 523.4,
"r_x2": 545.1,
"r_y2": 514.5,
"r_x3": 353.2,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 535.4,
"r_x1": 545.1,
"r_y1": 535.4,
"r_x2": 545.1,
"r_y2": 526.5,
"r_x3": 308.9,
"r_y3": 526.5,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 547.3,
"r_x1": 545.1,
"r_y1": 547.3,
"r_x2": 545.1,
"r_y2": 538.4,
"r_x3": 308.9,
"r_y3": 538.4,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 559.3,
"r_x1": 505.7,
"r_y1": 559.3,
"r_x2": 505.7,
"r_y2": 550.4,
"r_x3": 308.9,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 584.4,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 320.8,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.3,
"r_x1": 545.1,
"r_y1": 605.3,
"r_x2": 545.1,
"r_y2": 596.4,
"r_x3": 308.9,
"r_y3": 596.4,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.2,
"r_x1": 545.1,
"r_y1": 629.2,
"r_x2": 545.1,
"r_y2": 620.3,
"r_x3": 308.9,
"r_y3": 620.3,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 353.7,
"r_y1": 641.1,
"r_x2": 353.7,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.1,
"r_y0": 641.1,
"r_x1": 374.7,
"r_y1": 641.1,
"r_x2": 374.7,
"r_y2": 632.2,
"r_x3": 362.1,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.4,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 377.4,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.1,
"r_x1": 545.1,
"r_y1": 653.1,
"r_x2": 545.1,
"r_y2": 644.2,
"r_x3": 308.9,
"r_y3": 644.2,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 375.6,
"r_y1": 665.0,
"r_x2": 375.6,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.4,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 320.8,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.3,
"t": 207.8,
"r": 36.3,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.3,
"r_y0": 560.0,
"r_x1": 36.3,
"r_y1": 560.0,
"r_x2": 36.3,
"r_y2": 207.8,
"r_x3": 18.3,
"r_y3": 207.8,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"11": {
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"15": {
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 8,
"page_no": 0,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.0,
"r": 498.9,
"b": 119.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.9,
"r_x1": 498.9,
"r_y1": 119.9,
"r_x2": 498.9,
"r_y2": 107.0,
"r_x3": 96.3,
"r_y3": 107.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers."
},
{
"label": "section_header",
"id": 13,
"page_no": 0,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.5,
"t": 146.7,
"r": 452.8,
"b": 171.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.5,
"r_y0": 157.4,
"r_x1": 452.8,
"r_y1": 157.4,
"r_x2": 452.8,
"r_y2": 146.7,
"r_x3": 142.5,
"r_y3": 146.7,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.9,
"r_y0": 171.3,
"r_x1": 332.3,
"r_y1": 171.3,
"r_x2": 332.3,
"r_y2": 160.6,
"r_x3": 262.9,
"r_y3": 160.6,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"
},
{
"label": "key_value_region",
"id": 25,
"page_no": 0,
"cluster": {
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.49,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null
},
{
"label": "section_header",
"id": 5,
"page_no": 0,
"cluster": {
"id": 5,
"label": "section_header",
"bbox": {
"l": 146.0,
"t": 215.5,
"r": 190.5,
"b": 226.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 226.2,
"r_x1": 190.5,
"r_y1": 226.2,
"r_x2": 190.5,
"r_y2": 215.5,
"r_x3": 146.0,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Abstract"
},
{
"label": "text",
"id": 2,
"page_no": 0,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 241.4,
"r": 286.4,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 250.0,
"r_x1": 286.4,
"r_y1": 250.0,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 62.1,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 261.9,
"r_x1": 286.4,
"r_y1": 261.9,
"r_x2": 286.4,
"r_y2": 253.4,
"r_x3": 50.1,
"r_y3": 253.4,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 273.9,
"r_x1": 286.4,
"r_y1": 273.9,
"r_x2": 286.4,
"r_y2": 265.3,
"r_x3": 50.1,
"r_y3": 265.3,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 285.8,
"r_x1": 286.4,
"r_y1": 285.8,
"r_x2": 286.4,
"r_y2": 277.3,
"r_x3": 50.1,
"r_y3": 277.3,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 297.8,
"r_x1": 286.4,
"r_y1": 297.8,
"r_x2": 286.4,
"r_y2": 289.2,
"r_x3": 50.1,
"r_y3": 289.2,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 309.8,
"r_x1": 286.4,
"r_y1": 309.8,
"r_x2": 286.4,
"r_y2": 301.2,
"r_x3": 50.1,
"r_y3": 301.2,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 321.7,
"r_x1": 286.4,
"r_y1": 321.7,
"r_x2": 286.4,
"r_y2": 313.1,
"r_x3": 50.1,
"r_y3": 313.1,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 333.7,
"r_x1": 286.4,
"r_y1": 333.7,
"r_x2": 286.4,
"r_y2": 325.1,
"r_x3": 50.1,
"r_y3": 325.1,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 345.6,
"r_x1": 286.4,
"r_y1": 345.6,
"r_x2": 286.4,
"r_y2": 337.0,
"r_x3": 50.1,
"r_y3": 337.0,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 357.6,
"r_x1": 286.4,
"r_y1": 357.6,
"r_x2": 286.4,
"r_y2": 349.0,
"r_x3": 50.1,
"r_y3": 349.0,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 369.5,
"r_x1": 286.4,
"r_y1": 369.5,
"r_x2": 286.4,
"r_y2": 360.9,
"r_x3": 50.1,
"r_y3": 360.9,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 381.5,
"r_x1": 286.4,
"r_y1": 381.5,
"r_x2": 286.4,
"r_y2": 372.9,
"r_x3": 50.1,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 393.4,
"r_x1": 286.4,
"r_y1": 393.4,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 405.4,
"r_x1": 286.4,
"r_y1": 405.4,
"r_x2": 286.4,
"r_y2": 396.8,
"r_x3": 50.1,
"r_y3": 396.8,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 417.4,
"r_x1": 286.4,
"r_y1": 417.4,
"r_x2": 286.4,
"r_y2": 408.8,
"r_x3": 50.1,
"r_y3": 408.8,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 429.3,
"r_x1": 286.4,
"r_y1": 429.3,
"r_x2": 286.4,
"r_y2": 420.7,
"r_x3": 50.1,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 441.3,
"r_x1": 207.2,
"r_y1": 441.3,
"r_x2": 207.2,
"r_y2": 432.7,
"r_x3": 50.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.3,
"r_x1": 286.4,
"r_y1": 441.3,
"r_x2": 286.4,
"r_y2": 432.7,
"r_x3": 214.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 453.2,
"r_x1": 286.4,
"r_y1": 453.2,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 50.1,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 465.2,
"r_x1": 286.4,
"r_y1": 465.2,
"r_x2": 286.4,
"r_y2": 456.6,
"r_x3": 50.1,
"r_y3": 456.6,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 477.1,
"r_x1": 286.4,
"r_y1": 477.1,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 50.1,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 489.1,
"r_x1": 286.4,
"r_y1": 489.1,
"r_x2": 286.4,
"r_y2": 480.5,
"r_x3": 50.1,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.0,
"r_x1": 286.4,
"r_y1": 501.0,
"r_x2": 286.4,
"r_y2": 492.5,
"r_x3": 50.1,
"r_y3": 492.5,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 513.0,
"r_x1": 276.7,
"r_y1": 513.0,
"r_x2": 276.7,
"r_y2": 504.4,
"r_x3": 50.1,
"r_y3": 504.4,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."
},
{
"label": "section_header",
"id": 4,
"page_no": 0,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 539.9,
"r": 126.9,
"b": 550.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.7,
"r_x1": 58.1,
"r_y1": 550.7,
"r_x2": 58.1,
"r_y2": 539.9,
"r_x3": 50.1,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.7,
"r_x1": 126.9,
"r_y1": 550.7,
"r_x2": 126.9,
"r_y2": 539.9,
"r_x3": 68.8,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Introduction"
},
{
"label": "text",
"id": 1,
"page_no": 0,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 560.8,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 62.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 76.4,
"r_y1": 713.2,
"r_x2": 76.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."
},
{
"label": "section_header",
"id": 14,
"page_no": 0,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.6,
"t": 218.0,
"r": 408.4,
"b": 226.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.67,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 226.8,
"r_x1": 324.0,
"r_y1": 226.8,
"r_x2": 324.0,
"r_y2": 218.0,
"r_x3": 315.6,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.2,
"r_y0": 226.8,
"r_x1": 408.4,
"r_y1": 226.8,
"r_x2": 408.4,
"r_y2": 218.0,
"r_x3": 328.2,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a. Picture of a table:"
},
{
"label": "list_item",
"id": 17,
"page_no": 0,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 313.7,
"r": 486.4,
"b": 333.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 322.4,
"r_x1": 325.1,
"r_y1": 322.4,
"r_x2": 325.1,
"r_y2": 313.7,
"r_x3": 315.6,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.4,
"r_x1": 486.4,
"r_y1": 322.4,
"r_x2": 486.4,
"r_y2": 313.7,
"r_x3": 329.8,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.5,
"r_y0": 333.2,
"r_x1": 472.5,
"r_y1": 333.2,
"r_x2": 472.5,
"r_y2": 324.5,
"r_x3": 326.5,
"r_y3": 324.5,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"
},
{
"label": "list_item",
"id": 18,
"page_no": 0,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 420.2,
"r": 491.2,
"b": 428.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 428.9,
"r_x1": 324.8,
"r_y1": 428.9,
"r_x2": 324.8,
"r_y2": 420.2,
"r_x3": 315.6,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.4,
"r_y0": 428.9,
"r_x1": 491.2,
"r_y1": 428.9,
"r_x2": 491.2,
"r_y2": 420.2,
"r_x3": 329.4,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "c. Structure predicted by TableFormer:"
},
{
"label": "picture",
"id": 10,
"page_no": 0,
"cluster": {
"id": 10,
"label": "picture",
"bbox": {
"l": 314.8,
"t": 338.1,
"r": 539.2,
"b": 410.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.1,
"t": 342.8,
"r": 412.5,
"b": 351.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.1,
"t": 341.6,
"r": 360.5,
"b": 350.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.7,
"t": 340.9,
"r": 505.1,
"b": 349.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.1,
"t": 351.7,
"r": 360.5,
"b": 360.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.5,
"t": 355.9,
"r": 406.9,
"b": 364.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.6,
"t": 352.8,
"r": 453.0,
"b": 361.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.7,
"t": 353.7,
"r": 496.0,
"b": 362.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.1,
"t": 353.3,
"r": 539.5,
"b": 362.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.8,
"t": 387.1,
"r": 353.2,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.3,
"t": 375.4,
"r": 393.7,
"b": 384.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.7,
"t": 375.6,
"r": 451.5,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.4,
"t": 375.5,
"r": 485.9,
"b": 384.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.6,
"t": 375.6,
"r": 531.4,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.2,
"t": 387.1,
"r": 409.0,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.3,
"t": 387.0,
"r": 451.1,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.2,
"t": 387.4,
"r": 487.0,
"b": 396.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.2,
"t": 387.0,
"r": 532.0,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.6,
"t": 399.4,
"r": 416.0,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 416.0,
"t": 399.4,
"r": 420.4,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.3,
"t": 399.0,
"r": 451.1,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.8,
"t": 399.0,
"r": 487.6,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 524.0,
"t": 398.6,
"r": 532.8,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.1,
"t": 357.8,
"r": 391.1,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.4,
"t": 380.7,
"r": 339.4,
"b": 390.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.1,
"t": 341.0,
"r": 484.1,
"b": 351.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 23,
"page_no": 0,
"cluster": {
"id": 23,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.51,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "picture",
"id": 16,
"page_no": 0,
"cluster": {
"id": 16,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.61,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 0,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 514.5,
"r": 545.1,
"b": 559.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 523.4,
"r_x1": 345.7,
"r_y1": 523.4,
"r_x2": 345.7,
"r_y2": 514.5,
"r_x3": 308.9,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.2,
"r_y0": 523.4,
"r_x1": 545.1,
"r_y1": 523.4,
"r_x2": 545.1,
"r_y2": 514.5,
"r_x3": 353.2,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 535.4,
"r_x1": 545.1,
"r_y1": 535.4,
"r_x2": 545.1,
"r_y2": 526.5,
"r_x3": 308.9,
"r_y3": 526.5,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 547.3,
"r_x1": 545.1,
"r_y1": 547.3,
"r_x2": 545.1,
"r_y2": 538.4,
"r_x3": 308.9,
"r_y3": 538.4,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 559.3,
"r_x1": 505.7,
"r_y1": 559.3,
"r_x2": 505.7,
"r_y2": 550.4,
"r_x3": 308.9,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."
},
{
"label": "text",
"id": 0,
"page_no": 0,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 584.4,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 320.8,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.3,
"r_x1": 545.1,
"r_y1": 605.3,
"r_x2": 545.1,
"r_y2": 596.4,
"r_x3": 308.9,
"r_y3": 596.4,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.2,
"r_x1": 545.1,
"r_y1": 629.2,
"r_x2": 545.1,
"r_y2": 620.3,
"r_x3": 308.9,
"r_y3": 620.3,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 353.7,
"r_y1": 641.1,
"r_x2": 353.7,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.1,
"r_y0": 641.1,
"r_x1": 374.7,
"r_y1": 641.1,
"r_x2": 374.7,
"r_y2": 632.2,
"r_x3": 362.1,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.4,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 377.4,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.1,
"r_x1": 545.1,
"r_y1": 653.1,
"r_x2": 545.1,
"r_y2": 644.2,
"r_x3": 308.9,
"r_y3": 644.2,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 375.6,
"r_y1": 665.0,
"r_x2": 375.6,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."
},
{
"label": "text",
"id": 3,
"page_no": 0,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.4,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 320.8,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"
},
{
"label": "page_footer",
"id": 12,
"page_no": 0,
"cluster": {
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1"
},
{
"label": "page_header",
"id": 9,
"page_no": 0,
"cluster": {
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.3,
"t": 207.8,
"r": 36.3,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.3,
"r_y0": 560.0,
"r_x1": 36.3,
"r_y1": 560.0,
"r_x2": 36.3,
"r_y2": 207.8,
"r_x3": 18.3,
"r_y3": 207.8,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"
}
],
"body": [
{
"label": "section_header",
"id": 8,
"page_no": 0,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 96.3,
"t": 107.0,
"r": 498.9,
"b": 119.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.3,
"r_y0": 119.9,
"r_x1": 498.9,
"r_y1": 119.9,
"r_x2": 498.9,
"r_y2": 107.0,
"r_x3": 96.3,
"r_y3": 107.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers.",
"orig": "TableFormer: Table Structure Understanding with Transformers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers."
},
{
"label": "section_header",
"id": 13,
"page_no": 0,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 142.5,
"t": 146.7,
"r": 452.8,
"b": 171.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.5,
"r_y0": 157.4,
"r_x1": 452.8,
"r_y1": 157.4,
"r_x2": 452.8,
"r_y2": 146.7,
"r_x3": 142.5,
"r_y3": 146.7,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.9,
"r_y0": 171.3,
"r_x1": 332.3,
"r_y1": 171.3,
"r_x2": 332.3,
"r_y2": 160.6,
"r_x3": 262.9,
"r_y3": 160.6,
"coord_origin": "TOPLEFT"
},
"text": "IBM Research",
"orig": "IBM Research",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"
},
{
"label": "key_value_region",
"id": 25,
"page_no": 0,
"cluster": {
"id": 25,
"label": "key_value_region",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.49,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 7,
"label": "text",
"bbox": {
"l": 208.1,
"t": 176.0,
"r": 378.7,
"b": 184.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.1,
"r_y0": 184.4,
"r_x1": 212.7,
"r_y1": 184.4,
"r_x2": 212.7,
"r_y2": 176.0,
"r_x3": 208.1,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.7,
"r_y0": 184.0,
"r_x1": 293.4,
"r_y1": 184.0,
"r_x2": 293.4,
"r_y2": 177.1,
"r_x3": 212.7,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "ahn,nli,mly,taa",
"orig": "ahn,nli,mly,taa",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 293.4,
"r_y0": 184.4,
"r_x1": 298.0,
"r_y1": 184.4,
"r_x2": 298.0,
"r_y2": 176.0,
"r_x3": 293.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 298.0,
"r_y0": 184.0,
"r_x1": 378.7,
"r_y1": 184.0,
"r_x2": 378.7,
"r_y2": 177.1,
"r_x3": 298.0,
"r_y3": 177.1,
"coord_origin": "TOPLEFT"
},
"text": "@zurich.ibm.com",
"orig": "@zurich.ibm.com",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null
},
{
"label": "section_header",
"id": 5,
"page_no": 0,
"cluster": {
"id": 5,
"label": "section_header",
"bbox": {
"l": 146.0,
"t": 215.5,
"r": 190.5,
"b": 226.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 226.2,
"r_x1": 190.5,
"r_y1": 226.2,
"r_x2": 190.5,
"r_y2": 215.5,
"r_x3": 146.0,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "Abstract",
"orig": "Abstract",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Abstract"
},
{
"label": "text",
"id": 2,
"page_no": 0,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 241.4,
"r": 286.4,
"b": 513.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 250.0,
"r_x1": 286.4,
"r_y1": 250.0,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 62.1,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Tables organize valuable content in a concise and com-",
"orig": "Tables organize valuable content in a concise and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 261.9,
"r_x1": 286.4,
"r_y1": 261.9,
"r_x2": 286.4,
"r_y2": 253.4,
"r_x3": 50.1,
"r_y3": 253.4,
"coord_origin": "TOPLEFT"
},
"text": "pact representation. This content is extremely valuable for",
"orig": "pact representation. This content is extremely valuable for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 273.9,
"r_x1": 286.4,
"r_y1": 273.9,
"r_x2": 286.4,
"r_y2": 265.3,
"r_x3": 50.1,
"r_y3": 265.3,
"coord_origin": "TOPLEFT"
},
"text": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"orig": "systems such as search engines, Knowledge Graph\u2019s, etc,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 285.8,
"r_x1": 286.4,
"r_y1": 285.8,
"r_x2": 286.4,
"r_y2": 277.3,
"r_x3": 50.1,
"r_y3": 277.3,
"coord_origin": "TOPLEFT"
},
"text": "since they enhance their predictive capabilities. Unfortu-",
"orig": "since they enhance their predictive capabilities. Unfortu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 297.8,
"r_x1": 286.4,
"r_y1": 297.8,
"r_x2": 286.4,
"r_y2": 289.2,
"r_x3": 50.1,
"r_y3": 289.2,
"coord_origin": "TOPLEFT"
},
"text": "nately, tables come in a large variety of shapes and sizes.",
"orig": "nately, tables come in a large variety of shapes and sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 309.8,
"r_x1": 286.4,
"r_y1": 309.8,
"r_x2": 286.4,
"r_y2": 301.2,
"r_x3": 50.1,
"r_y3": 301.2,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, they can have complex column/row-header",
"orig": "Furthermore, they can have complex column/row-header",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 321.7,
"r_x1": 286.4,
"r_y1": 321.7,
"r_x2": 286.4,
"r_y2": 313.1,
"r_x3": 50.1,
"r_y3": 313.1,
"coord_origin": "TOPLEFT"
},
"text": "configurations, multiline rows, different variety of separa-",
"orig": "configurations, multiline rows, different variety of separa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 333.7,
"r_x1": 286.4,
"r_y1": 333.7,
"r_x2": 286.4,
"r_y2": 325.1,
"r_x3": 50.1,
"r_y3": 325.1,
"coord_origin": "TOPLEFT"
},
"text": "tion lines, missing entries, etc. As such, the correct iden-",
"orig": "tion lines, missing entries, etc. As such, the correct iden-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 345.6,
"r_x1": 286.4,
"r_y1": 345.6,
"r_x2": 286.4,
"r_y2": 337.0,
"r_x3": 50.1,
"r_y3": 337.0,
"coord_origin": "TOPLEFT"
},
"text": "tification of the table-structure from an image is a non-",
"orig": "tification of the table-structure from an image is a non-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 357.6,
"r_x1": 286.4,
"r_y1": 357.6,
"r_x2": 286.4,
"r_y2": 349.0,
"r_x3": 50.1,
"r_y3": 349.0,
"coord_origin": "TOPLEFT"
},
"text": "trivial task. In this paper, we present a new table-structure",
"orig": "trivial task. In this paper, we present a new table-structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 369.5,
"r_x1": 286.4,
"r_y1": 369.5,
"r_x2": 286.4,
"r_y2": 360.9,
"r_x3": 50.1,
"r_y3": 360.9,
"coord_origin": "TOPLEFT"
},
"text": "identification model. The latter improves the latest end-to-",
"orig": "identification model. The latter improves the latest end-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 381.5,
"r_x1": 286.4,
"r_y1": 381.5,
"r_x2": 286.4,
"r_y2": 372.9,
"r_x3": 50.1,
"r_y3": 372.9,
"coord_origin": "TOPLEFT"
},
"text": "end deep learning model (i.e. encoder-dual-decoder from",
"orig": "end deep learning model (i.e. encoder-dual-decoder from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 393.4,
"r_x1": 286.4,
"r_y1": 393.4,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet) in two significant ways. First, we introduce a",
"orig": "PubTabNet) in two significant ways. First, we introduce a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 405.4,
"r_x1": 286.4,
"r_y1": 405.4,
"r_x2": 286.4,
"r_y2": 396.8,
"r_x3": 50.1,
"r_y3": 396.8,
"coord_origin": "TOPLEFT"
},
"text": "new object detection decoder for table-cells. In this way,",
"orig": "new object detection decoder for table-cells. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 417.4,
"r_x1": 286.4,
"r_y1": 417.4,
"r_x2": 286.4,
"r_y2": 408.8,
"r_x3": 50.1,
"r_y3": 408.8,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the content of the table-cells from program-",
"orig": "we can obtain the content of the table-cells from program-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 429.3,
"r_x1": 286.4,
"r_y1": 429.3,
"r_x2": 286.4,
"r_y2": 420.7,
"r_x3": 50.1,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "matic PDF\u2019s directly from the PDF source and avoid the",
"orig": "matic PDF\u2019s directly from the PDF source and avoid the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 441.3,
"r_x1": 207.2,
"r_y1": 441.3,
"r_x2": 207.2,
"r_y2": 432.7,
"r_x3": 50.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "training of the custom OCR decoders.",
"orig": "training of the custom OCR decoders.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.1,
"r_y0": 441.3,
"r_x1": 286.4,
"r_y1": 441.3,
"r_x2": 286.4,
"r_y2": 432.7,
"r_x3": 214.1,
"r_y3": 432.7,
"coord_origin": "TOPLEFT"
},
"text": "This architectural",
"orig": "This architectural",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 453.2,
"r_x1": 286.4,
"r_y1": 453.2,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 50.1,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "change leads to more accurate table-content extraction and",
"orig": "change leads to more accurate table-content extraction and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 465.2,
"r_x1": 286.4,
"r_y1": 465.2,
"r_x2": 286.4,
"r_y2": 456.6,
"r_x3": 50.1,
"r_y3": 456.6,
"coord_origin": "TOPLEFT"
},
"text": "allows us to tackle non-english tables. Second, we replace",
"orig": "allows us to tackle non-english tables. Second, we replace",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 477.1,
"r_x1": 286.4,
"r_y1": 477.1,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 50.1,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the LSTM decoders with transformer based decoders. This",
"orig": "the LSTM decoders with transformer based decoders. This",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 489.1,
"r_x1": 286.4,
"r_y1": 489.1,
"r_x2": 286.4,
"r_y2": 480.5,
"r_x3": 50.1,
"r_y3": 480.5,
"coord_origin": "TOPLEFT"
},
"text": "upgrade improves significantly the previous state-of-the-art",
"orig": "upgrade improves significantly the previous state-of-the-art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.0,
"r_x1": 286.4,
"r_y1": 501.0,
"r_x2": 286.4,
"r_y2": 492.5,
"r_x3": 50.1,
"r_y3": 492.5,
"coord_origin": "TOPLEFT"
},
"text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 513.0,
"r_x1": 276.7,
"r_y1": 513.0,
"r_x2": 276.7,
"r_y2": 504.4,
"r_x3": 50.1,
"r_y3": 504.4,
"coord_origin": "TOPLEFT"
},
"text": "simple tables and from 88.7% to 95% on complex tables.",
"orig": "simple tables and from 88.7% to 95% on complex tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."
},
{
"label": "section_header",
"id": 4,
"page_no": 0,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 539.9,
"r": 126.9,
"b": 550.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.7,
"r_x1": 58.1,
"r_y1": 550.7,
"r_x2": 58.1,
"r_y2": 539.9,
"r_x3": 50.1,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.8,
"r_y0": 550.7,
"r_x1": 126.9,
"r_y1": 550.7,
"r_x2": 126.9,
"r_y2": 539.9,
"r_x3": 68.8,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "Introduction",
"orig": "Introduction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Introduction"
},
{
"label": "text",
"id": 1,
"page_no": 0,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 560.8,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 62.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "The occurrence of tables in documents is ubiquitous.",
"orig": "The occurrence of tables in documents is ubiquitous.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "They often summarise quantitative or factual data, which is",
"orig": "They often summarise quantitative or factual data, which is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "cumbersome to describe in verbose text but nevertheless ex-",
"orig": "cumbersome to describe in verbose text but nevertheless ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "tremely valuable. Unfortunately, this compact representa-",
"orig": "tremely valuable. Unfortunately, this compact representa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "tion is often not easy to parse by machines. There are many",
"orig": "tion is often not easy to parse by machines. There are many",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "implicit conventions used to obtain a compact table repre-",
"orig": "implicit conventions used to obtain a compact table repre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "sentation. For example, tables often have complex column-",
"orig": "sentation. For example, tables often have complex column-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "and row-headers in order to reduce duplicated cell content.",
"orig": "and row-headers in order to reduce duplicated cell content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "Lines of different shapes and sizes are leveraged to separate",
"orig": "Lines of different shapes and sizes are leveraged to separate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "content or indicate a tree structure. Additionally, tables can",
"orig": "content or indicate a tree structure. Additionally, tables can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "also have empty/missing table-entries or multi-row textual",
"orig": "also have empty/missing table-entries or multi-row textual",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "table-entries. Fig. 1 shows a table which presents all these",
"orig": "table-entries. Fig. 1 shows a table which presents all these",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 76.4,
"r_y1": 713.2,
"r_x2": 76.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "issues.",
"orig": "issues.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."
},
{
"label": "section_header",
"id": 14,
"page_no": 0,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 315.6,
"t": 218.0,
"r": 408.4,
"b": 226.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.67,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 226.8,
"r_x1": 324.0,
"r_y1": 226.8,
"r_x2": 324.0,
"r_y2": 218.0,
"r_x3": 315.6,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.2,
"r_y0": 226.8,
"r_x1": 408.4,
"r_y1": 226.8,
"r_x2": 408.4,
"r_y2": 218.0,
"r_x3": 328.2,
"r_y3": 218.0,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table:",
"orig": "Picture of a table:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a. Picture of a table:"
},
{
"label": "list_item",
"id": 17,
"page_no": 0,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 313.7,
"r": 486.4,
"b": 333.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 322.4,
"r_x1": 325.1,
"r_y1": 322.4,
"r_x2": 325.1,
"r_y2": 313.7,
"r_x3": 315.6,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.8,
"r_y0": 322.4,
"r_x1": 486.4,
"r_y1": 322.4,
"r_x2": 486.4,
"r_y2": 313.7,
"r_x3": 329.8,
"r_y3": 313.7,
"coord_origin": "TOPLEFT"
},
"text": "Red-annotation of bounding boxes,",
"orig": "Red-annotation of bounding boxes,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.5,
"r_y0": 333.2,
"r_x1": 472.5,
"r_y1": 333.2,
"r_x2": 472.5,
"r_y2": 324.5,
"r_x3": 326.5,
"r_y3": 324.5,
"coord_origin": "TOPLEFT"
},
"text": "Blue-predictions by TableFormer",
"orig": "Blue-predictions by TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"
},
{
"label": "list_item",
"id": 18,
"page_no": 0,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 315.6,
"t": 420.2,
"r": 491.2,
"b": 428.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.6,
"r_y0": 428.9,
"r_x1": 324.8,
"r_y1": 428.9,
"r_x2": 324.8,
"r_y2": 420.2,
"r_x3": 315.6,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "c.",
"orig": "c.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.4,
"r_y0": 428.9,
"r_x1": 491.2,
"r_y1": 428.9,
"r_x2": 491.2,
"r_y2": 420.2,
"r_x3": 329.4,
"r_y3": 420.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer:",
"orig": "Structure predicted by TableFormer:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "c. Structure predicted by TableFormer:"
},
{
"label": "picture",
"id": 10,
"page_no": 0,
"cluster": {
"id": 10,
"label": "picture",
"bbox": {
"l": 314.8,
"t": 338.1,
"r": 539.2,
"b": 410.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 40,
"label": "text",
"bbox": {
"l": 408.1,
"t": 342.8,
"r": 412.5,
"b": 351.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 351.6,
"r_x1": 412.5,
"r_y1": 351.6,
"r_x2": 412.5,
"r_y2": 342.8,
"r_x3": 408.1,
"r_y3": 342.8,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 356.1,
"t": 341.6,
"r": 360.5,
"b": 350.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 350.4,
"r_x1": 360.5,
"r_y1": 350.4,
"r_x2": 360.5,
"r_y2": 341.6,
"r_x3": 356.1,
"r_y3": 341.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 500.7,
"t": 340.9,
"r": 505.1,
"b": 349.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.7,
"r_y0": 349.7,
"r_x1": 505.1,
"r_y1": 349.7,
"r_x2": 505.1,
"r_y2": 340.9,
"r_x3": 500.7,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 356.1,
"t": 351.7,
"r": 360.5,
"b": 360.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 356.1,
"r_y0": 360.5,
"r_x1": 360.5,
"r_y1": 360.5,
"r_x2": 360.5,
"r_y2": 351.7,
"r_x3": 356.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 402.5,
"t": 355.9,
"r": 406.9,
"b": 364.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 402.5,
"r_y0": 364.7,
"r_x1": 406.9,
"r_y1": 364.7,
"r_x2": 406.9,
"r_y2": 355.9,
"r_x3": 402.5,
"r_y3": 355.9,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 448.6,
"t": 352.8,
"r": 453.0,
"b": 361.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.6,
"r_y0": 361.6,
"r_x1": 453.0,
"r_y1": 361.6,
"r_x2": 453.0,
"r_y2": 352.8,
"r_x3": 448.6,
"r_y3": 352.8,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 491.7,
"t": 353.7,
"r": 496.0,
"b": 362.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 491.7,
"r_y0": 362.5,
"r_x1": 496.0,
"r_y1": 362.5,
"r_x2": 496.0,
"r_y2": 353.7,
"r_x3": 491.7,
"r_y3": 353.7,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 535.1,
"t": 353.3,
"r": 539.5,
"b": 362.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 535.1,
"r_y0": 362.1,
"r_x1": 539.5,
"r_y1": 362.1,
"r_x2": 539.5,
"r_y2": 353.3,
"r_x3": 535.1,
"r_y3": 353.3,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 348.8,
"t": 387.1,
"r": 353.2,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.8,
"r_y0": 395.9,
"r_x1": 353.2,
"r_y1": 395.9,
"r_x2": 353.2,
"r_y2": 387.1,
"r_x3": 348.8,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 389.3,
"t": 375.4,
"r": 393.7,
"b": 384.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.3,
"r_y0": 384.2,
"r_x1": 393.7,
"r_y1": 384.2,
"r_x2": 393.7,
"r_y2": 375.4,
"r_x3": 389.3,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 442.7,
"t": 375.6,
"r": 451.5,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.7,
"r_y0": 384.4,
"r_x1": 451.5,
"r_y1": 384.4,
"r_x2": 451.5,
"r_y2": 375.6,
"r_x3": 442.7,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 477.4,
"t": 375.5,
"r": 485.9,
"b": 384.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.4,
"r_y0": 384.3,
"r_x1": 485.9,
"r_y1": 384.3,
"r_x2": 485.9,
"r_y2": 375.5,
"r_x3": 477.4,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 522.6,
"t": 375.6,
"r": 531.4,
"b": 384.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 522.6,
"r_y0": 384.4,
"r_x1": 531.4,
"r_y1": 384.4,
"r_x2": 531.4,
"r_y2": 375.6,
"r_x3": 522.6,
"r_y3": 375.6,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 400.2,
"t": 387.1,
"r": 409.0,
"b": 395.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.2,
"r_y0": 395.9,
"r_x1": 409.0,
"r_y1": 395.9,
"r_x2": 409.0,
"r_y2": 387.1,
"r_x3": 400.2,
"r_y3": 387.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 442.3,
"t": 387.0,
"r": 451.1,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 395.8,
"r_x1": 451.1,
"r_y1": 395.8,
"r_x2": 451.1,
"r_y2": 387.0,
"r_x3": 442.3,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 478.2,
"t": 387.4,
"r": 487.0,
"b": 396.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.2,
"r_y0": 396.2,
"r_x1": 487.0,
"r_y1": 396.2,
"r_x2": 487.0,
"r_y2": 387.4,
"r_x3": 478.2,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 523.2,
"t": 387.0,
"r": 532.0,
"b": 395.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 523.2,
"r_y0": 395.8,
"r_x1": 532.0,
"r_y1": 395.8,
"r_x2": 532.0,
"r_y2": 387.0,
"r_x3": 523.2,
"r_y3": 387.0,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 411.6,
"t": 399.4,
"r": 416.0,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.6,
"r_y0": 408.2,
"r_x1": 416.0,
"r_y1": 408.2,
"r_x2": 416.0,
"r_y2": 399.4,
"r_x3": 411.6,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 416.0,
"t": 399.4,
"r": 420.4,
"b": 408.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.0,
"r_y0": 408.2,
"r_x1": 420.4,
"r_y1": 408.2,
"r_x2": 420.4,
"r_y2": 399.4,
"r_x3": 416.0,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 442.3,
"t": 399.0,
"r": 451.1,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.3,
"r_y0": 407.8,
"r_x1": 451.1,
"r_y1": 407.8,
"r_x2": 451.1,
"r_y2": 399.0,
"r_x3": 442.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 478.8,
"t": 399.0,
"r": 487.6,
"b": 407.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.8,
"r_y0": 407.8,
"r_x1": 487.6,
"r_y1": 407.8,
"r_x2": 487.6,
"r_y2": 399.0,
"r_x3": 478.8,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 524.0,
"t": 398.6,
"r": 532.8,
"b": 407.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.0,
"r_y0": 407.4,
"r_x1": 532.8,
"r_y1": 407.4,
"r_x2": 532.8,
"r_y2": 398.6,
"r_x3": 524.0,
"r_y3": 398.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 385.1,
"t": 357.8,
"r": 391.1,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 367.9,
"r_x1": 391.1,
"r_y1": 367.9,
"r_x2": 391.1,
"r_y2": 357.8,
"r_x3": 385.1,
"r_y3": 357.8,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 333.4,
"t": 380.7,
"r": 339.4,
"b": 390.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.4,
"r_y0": 390.9,
"r_x1": 339.4,
"r_y1": 390.9,
"r_x2": 339.4,
"r_y2": 380.7,
"r_x3": 333.4,
"r_y3": 380.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 478.1,
"t": 341.0,
"r": 484.1,
"b": 351.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 478.1,
"r_y0": 351.2,
"r_x1": 484.1,
"r_y1": 351.2,
"r_x2": 484.1,
"r_y2": 341.0,
"r_x3": 478.1,
"r_y3": 341.0,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 23,
"page_no": 0,
"cluster": {
"id": 23,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.51,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 0,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 315.7,
"t": 433.8,
"r": 536.8,
"b": 496.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 62,
"label": "text",
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 446.5,
"r_x1": 351.6,
"r_y1": 446.5,
"r_x2": 351.6,
"r_y2": 437.7,
"r_x3": 347.2,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.9,
"r_y0": 446.5,
"r_x1": 323.3,
"r_y1": 446.5,
"r_x2": 323.3,
"r_y2": 437.7,
"r_x3": 318.9,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 394.1,
"t": 437.7,
"r": 398.5,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 446.5,
"r_x1": 398.5,
"r_y1": 446.5,
"r_x2": 398.5,
"r_y2": 437.7,
"r_x3": 394.1,
"r_y3": 437.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 458.3,
"r_x1": 323.2,
"r_y1": 458.3,
"r_x2": 323.2,
"r_y2": 449.5,
"r_x3": 318.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 347.2,
"t": 449.5,
"r": 351.6,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 458.3,
"r_x1": 351.6,
"r_y1": 458.3,
"r_x2": 351.6,
"r_y2": 449.5,
"r_x3": 347.2,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 458.3,
"r_x1": 398.5,
"r_y1": 458.3,
"r_x2": 398.5,
"r_y2": 449.5,
"r_x3": 394.1,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 458.3,
"r_x1": 445.4,
"r_y1": 458.3,
"r_x2": 445.4,
"r_y2": 449.5,
"r_x3": 441.0,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 458.3,
"r_x1": 492.2,
"r_y1": 458.3,
"r_x2": 492.2,
"r_y2": 449.5,
"r_x3": 487.8,
"r_y3": 449.5,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.8,
"r_y0": 482.5,
"r_x1": 323.2,
"r_y1": 482.5,
"r_x2": 323.2,
"r_y2": 473.7,
"r_x3": 318.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 470.6,
"r_x1": 351.6,
"r_y1": 470.6,
"r_x2": 351.6,
"r_y2": 461.8,
"r_x3": 347.2,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 470.6,
"r_x1": 402.9,
"r_y1": 470.6,
"r_x2": 402.9,
"r_y2": 461.8,
"r_x3": 394.1,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 470.6,
"r_x1": 449.4,
"r_y1": 470.6,
"r_x2": 449.4,
"r_y2": 461.8,
"r_x3": 441.0,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 470.6,
"r_x1": 496.6,
"r_y1": 470.6,
"r_x2": 496.6,
"r_y2": 461.8,
"r_x3": 487.8,
"r_y3": 461.8,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 482.5,
"r_x1": 356.0,
"r_y1": 482.5,
"r_x2": 356.0,
"r_y2": 473.7,
"r_x3": 347.2,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 482.5,
"r_x1": 402.9,
"r_y1": 482.5,
"r_x2": 402.9,
"r_y2": 473.7,
"r_x3": 394.1,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 482.5,
"r_x1": 449.7,
"r_y1": 482.5,
"r_x2": 449.7,
"r_y2": 473.7,
"r_x3": 441.0,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 482.5,
"r_x1": 496.6,
"r_y1": 482.5,
"r_x2": 496.6,
"r_y2": 473.7,
"r_x3": 487.8,
"r_y3": 473.7,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.2,
"r_y0": 493.9,
"r_x1": 356.0,
"r_y1": 493.9,
"r_x2": 356.0,
"r_y2": 485.1,
"r_x3": 347.2,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.1,
"r_y0": 493.9,
"r_x1": 402.9,
"r_y1": 493.9,
"r_x2": 402.9,
"r_y2": 485.1,
"r_x3": 394.1,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.0,
"r_y0": 493.9,
"r_x1": 449.7,
"r_y1": 493.9,
"r_x2": 449.7,
"r_y2": 485.1,
"r_x3": 441.0,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 487.8,
"r_y0": 493.9,
"r_x1": 496.6,
"r_y1": 493.9,
"r_x2": 496.6,
"r_y2": 485.1,
"r_x3": 487.8,
"r_y3": 485.1,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 366.7,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 366.7,
"r_y0": 459.3,
"r_x1": 372.7,
"r_y1": 459.3,
"r_x2": 372.7,
"r_y2": 449.1,
"r_x3": 366.7,
"r_y3": 449.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 331.9,
"t": 473.3,
"r": 337.9,
"b": 483.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.9,
"r_y0": 483.5,
"r_x1": 337.9,
"r_y1": 483.5,
"r_x2": 337.9,
"r_y2": 473.3,
"r_x3": 331.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 459.9,
"t": 437.6,
"r": 465.9,
"b": 447.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.9,
"r_y0": 447.7,
"r_x1": 465.9,
"r_y1": 447.7,
"r_x2": 465.9,
"r_y2": 437.6,
"r_x3": 459.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"lcel",
"lcel",
"lcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 5,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 347.2,
"t": 437.7,
"r": 351.6,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 4,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 5,
"text": "1 2 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.9,
"t": 437.7,
"r": 323.3,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 449.5,
"r": 323.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 449.1,
"r": 372.7,
"b": 459.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4 3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 449.5,
"r": 398.5,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 449.5,
"r": 445.4,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 449.5,
"r": 492.2,
"b": 458.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 318.8,
"t": 473.7,
"r": 323.2,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "8 2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 461.8,
"r": 351.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 461.8,
"r": 402.9,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "10",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 461.8,
"r": 449.4,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "11",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 461.8,
"r": 496.6,
"b": 470.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "12",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 473.7,
"r": 356.0,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "13",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 473.7,
"r": 402.9,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 473.7,
"r": 449.7,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "15",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 473.7,
"r": 496.6,
"b": 482.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "16",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 347.2,
"t": 485.1,
"r": 356.0,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "17",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.1,
"t": 485.1,
"r": 402.9,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 441.0,
"t": 485.1,
"r": 449.7,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 487.8,
"t": 485.1,
"r": 496.6,
"b": 493.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "20",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "picture",
"id": 16,
"page_no": 0,
"cluster": {
"id": 16,
"label": "picture",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.61,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 15,
"page_no": 0,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 315.7,
"t": 228.7,
"r": 537.1,
"b": 302.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 451.9,
"r_y0": 245.5,
"r_x1": 458.0,
"r_y1": 245.5,
"r_x2": 458.0,
"r_y2": 235.3,
"r_x3": 451.9,
"r_y3": 235.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 331.2,
"t": 269.4,
"r": 337.2,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.2,
"r_y0": 279.5,
"r_x1": 337.2,
"r_y1": 279.5,
"r_x2": 337.2,
"r_y2": 269.4,
"r_x3": 331.2,
"r_y3": 269.4,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 384.0,
"t": 252.7,
"r": 390.0,
"b": 262.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 262.8,
"r_x1": 390.0,
"r_y1": 262.8,
"r_x2": 390.0,
"r_y2": 252.7,
"r_x3": 384.0,
"r_y3": 252.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"ucel",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 1,
"num_cols": 1,
"table_cells": [
{
"bbox": {
"l": 451.9,
"t": 235.3,
"r": 458.0,
"b": 245.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "1",
"column_header": true,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 0,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 514.5,
"r": 545.1,
"b": 559.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 523.4,
"r_x1": 345.7,
"r_y1": 523.4,
"r_x2": 345.7,
"r_y2": 514.5,
"r_x3": 308.9,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 1:",
"orig": "Figure 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 353.2,
"r_y0": 523.4,
"r_x1": 545.1,
"r_y1": 523.4,
"r_x2": 545.1,
"r_y2": 514.5,
"r_x3": 353.2,
"r_y3": 514.5,
"coord_origin": "TOPLEFT"
},
"text": "Picture of a table with subtle, complex features",
"orig": "Picture of a table with subtle, complex features",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 535.4,
"r_x1": 545.1,
"r_y1": 535.4,
"r_x2": 545.1,
"r_y2": 526.5,
"r_x3": 308.9,
"r_y3": 526.5,
"coord_origin": "TOPLEFT"
},
"text": "such as (1) multi-column headers, (2) cell with multi-row",
"orig": "such as (1) multi-column headers, (2) cell with multi-row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 547.3,
"r_x1": 545.1,
"r_y1": 547.3,
"r_x2": 545.1,
"r_y2": 538.4,
"r_x3": 308.9,
"r_y3": 538.4,
"coord_origin": "TOPLEFT"
},
"text": "text and (3) cells with no content. Image from PubTabNet",
"orig": "text and (3) cells with no content. Image from PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 559.3,
"r_x1": 505.7,
"r_y1": 559.3,
"r_x2": 505.7,
"r_y2": 550.4,
"r_x3": 308.9,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"orig": "evaluation set, filename: \u2018PMC2944238 004 02\u2019.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."
},
{
"label": "text",
"id": 0,
"page_no": 0,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 584.4,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 320.8,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "Recently, significant progress has been made with vi-",
"orig": "Recently, significant progress has been made with vi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.3,
"r_x1": 545.1,
"r_y1": 605.3,
"r_x2": 545.1,
"r_y2": 596.4,
"r_x3": 308.9,
"r_y3": 596.4,
"coord_origin": "TOPLEFT"
},
"text": "sion based approaches to extract tables in documents. For",
"orig": "sion based approaches to extract tables in documents. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "the sake of completeness, the issue of table extraction from",
"orig": "the sake of completeness, the issue of table extraction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.2,
"r_x1": 545.1,
"r_y1": 629.2,
"r_x2": 545.1,
"r_y2": 620.3,
"r_x3": 308.9,
"r_y3": 620.3,
"coord_origin": "TOPLEFT"
},
"text": "documents is typically decomposed into two separate chal-",
"orig": "documents is typically decomposed into two separate chal-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 353.7,
"r_y1": 641.1,
"r_x2": 353.7,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "lenges, i.e.",
"orig": "lenges, i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 362.1,
"r_y0": 641.1,
"r_x1": 374.7,
"r_y1": 641.1,
"r_x2": 374.7,
"r_y2": 632.2,
"r_x3": 362.1,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.4,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 377.4,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "finding the location of the table(s) on a",
"orig": "finding the location of the table(s) on a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.1,
"r_x1": 545.1,
"r_y1": 653.1,
"r_x2": 545.1,
"r_y2": 644.2,
"r_x3": 308.9,
"r_y3": 644.2,
"coord_origin": "TOPLEFT"
},
"text": "document-page and (2) finding the structure of a given table",
"orig": "document-page and (2) finding the structure of a given table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 375.6,
"r_y1": 665.0,
"r_x2": 375.6,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "in the document.",
"orig": "in the document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."
},
{
"label": "text",
"id": 3,
"page_no": 0,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.4,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 320.8,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "The first problem is called table-location and has been",
"orig": "The first problem is called table-location and has been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art object-detection networks (e.g. YOLO and later",
"orig": "of-the-art object-detection networks (e.g. YOLO and later",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "on Mask-RCNN [9]). For all practical purposes, it can be",
"orig": "on Mask-RCNN [9]). For all practical purposes, it can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with state-of-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"
}
],
"headers": [
{
"label": "page_footer",
"id": 12,
"page_no": 0,
"cluster": {
"id": 12,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1"
},
{
"label": "page_header",
"id": 9,
"page_no": 0,
"cluster": {
"id": 9,
"label": "page_header",
"bbox": {
"l": 18.3,
"t": 207.8,
"r": 36.3,
"b": 560.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 18.3,
"r_y0": 560.0,
"r_x1": 36.3,
"r_y1": 560.0,
"r_x2": 36.3,
"r_y2": 207.8,
"r_x3": 18.3,
"r_y3": 207.8,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"orig": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "arXiv:2203.01017v2 [cs.CV] 11 Mar 2022"
}
]
}
},
{
"page_no": 1,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 112.6,
"r_y1": 96.1,
"r_x2": 112.6,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 108.5,
"r_x1": 286.4,
"r_y1": 108.5,
"r_x2": 286.4,
"r_y2": 99.6,
"r_x3": 62.1,
"r_y3": 99.6,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.4,
"r_x1": 74.7,
"r_y1": 120.4,
"r_x2": 74.7,
"r_y2": 111.5,
"r_x3": 50.1,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 120.4,
"r_x1": 286.4,
"r_y1": 120.4,
"r_x2": 286.4,
"r_y2": 111.5,
"r_x3": 81.3,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.4,
"r_x1": 286.4,
"r_y1": 132.4,
"r_x2": 286.4,
"r_y2": 123.5,
"r_x3": 50.1,
"r_y3": 123.5,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 144.3,
"r_x1": 286.4,
"r_y1": 144.3,
"r_x2": 286.4,
"r_y2": 135.4,
"r_x3": 50.1,
"r_y3": 135.4,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 156.3,
"r_x1": 286.4,
"r_y1": 156.3,
"r_x2": 286.4,
"r_y2": 147.4,
"r_x3": 50.1,
"r_y3": 147.4,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 168.3,
"r_x1": 286.4,
"r_y1": 168.3,
"r_x2": 286.4,
"r_y2": 159.3,
"r_x3": 50.1,
"r_y3": 159.3,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.2,
"r_x1": 286.4,
"r_y1": 180.2,
"r_x2": 286.4,
"r_y2": 171.3,
"r_x3": 50.1,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.2,
"r_x1": 286.4,
"r_y1": 192.2,
"r_x2": 286.4,
"r_y2": 183.3,
"r_x3": 50.1,
"r_y3": 183.3,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.1,
"r_x1": 286.4,
"r_y1": 204.1,
"r_x2": 286.4,
"r_y2": 195.2,
"r_x3": 50.1,
"r_y3": 195.2,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 207.2,
"r_x3": 50.1,
"r_y3": 207.2,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.0,
"r_x1": 278.7,
"r_y1": 228.0,
"r_x2": 278.7,
"r_y2": 219.1,
"r_x3": 50.1,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 240.4,
"r_x1": 286.4,
"r_y1": 240.4,
"r_x2": 286.4,
"r_y2": 231.5,
"r_x3": 62.1,
"r_y3": 231.5,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 252.4,
"r_x1": 286.4,
"r_y1": 252.4,
"r_x2": 286.4,
"r_y2": 243.5,
"r_x3": 50.1,
"r_y3": 243.5,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.3,
"r_x1": 286.4,
"r_y1": 264.3,
"r_x2": 286.4,
"r_y2": 255.4,
"r_x3": 50.1,
"r_y3": 255.4,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.3,
"r_x1": 286.4,
"r_y1": 276.3,
"r_x2": 286.4,
"r_y2": 267.4,
"r_x3": 50.1,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.3,
"r_x1": 286.4,
"r_y1": 288.3,
"r_x2": 286.4,
"r_y2": 279.4,
"r_x3": 50.1,
"r_y3": 279.4,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.2,
"r_x1": 88.6,
"r_y1": 300.2,
"r_x2": 88.6,
"r_y2": 291.3,
"r_x3": 50.1,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.2,
"r_x1": 286.4,
"r_y1": 300.2,
"r_x2": 286.4,
"r_y2": 291.3,
"r_x3": 95.5,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.2,
"r_x1": 286.4,
"r_y1": 312.2,
"r_x2": 286.4,
"r_y2": 303.3,
"r_x3": 50.1,
"r_y3": 303.3,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.1,
"r_x1": 286.4,
"r_y1": 324.1,
"r_x2": 286.4,
"r_y2": 315.2,
"r_x3": 50.1,
"r_y3": 315.2,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.1,
"r_x1": 286.4,
"r_y1": 336.1,
"r_x2": 286.4,
"r_y2": 327.2,
"r_x3": 50.1,
"r_y3": 327.2,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.0,
"r_x1": 286.4,
"r_y1": 348.0,
"r_x2": 286.4,
"r_y2": 339.1,
"r_x3": 50.1,
"r_y3": 339.1,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.0,
"r_x1": 286.4,
"r_y1": 360.0,
"r_x2": 286.4,
"r_y2": 351.1,
"r_x3": 50.1,
"r_y3": 351.1,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.9,
"r_x1": 77.0,
"r_y1": 371.9,
"r_x2": 77.0,
"r_y2": 363.0,
"r_x3": 50.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 384.4,
"r_x1": 286.4,
"r_y1": 384.4,
"r_x2": 286.4,
"r_y2": 375.4,
"r_x3": 62.1,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.3,
"r_x1": 121.0,
"r_y1": 396.3,
"r_x2": 121.0,
"r_y2": 387.4,
"r_x3": 50.1,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.2,
"r_x1": 179.7,
"r_y1": 396.2,
"r_x2": 179.7,
"r_y2": 387.3,
"r_x3": 123.9,
"r_y3": 387.3,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 396.3,
"r_x1": 286.4,
"r_y1": 396.3,
"r_x2": 286.4,
"r_y2": 387.4,
"r_x3": 182.6,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.3,
"r_x1": 181.8,
"r_y1": 408.3,
"r_x2": 181.8,
"r_y2": 399.4,
"r_x3": 50.1,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.2,
"r_x1": 240.2,
"r_y1": 408.2,
"r_x2": 240.2,
"r_y2": 399.2,
"r_x3": 184.1,
"r_y3": 399.2,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.3,
"r_x1": 286.4,
"r_y1": 408.3,
"r_x2": 286.4,
"r_y2": 399.4,
"r_x3": 240.2,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.2,
"r_x1": 286.4,
"r_y1": 420.2,
"r_x2": 286.4,
"r_y2": 411.3,
"r_x3": 50.1,
"r_y3": 411.3,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.2,
"r_x1": 82.5,
"r_y1": 432.2,
"r_x2": 82.5,
"r_y2": 423.3,
"r_x3": 50.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 453.5,
"r_x1": 70.7,
"r_y1": 453.5,
"r_x2": 70.7,
"r_y2": 444.6,
"r_x3": 61.6,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.0,
"r_y0": 453.5,
"r_x1": 117.1,
"r_y1": 453.5,
"r_x2": 117.1,
"r_y2": 444.6,
"r_x3": 73.0,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.6,
"r_y0": 453.4,
"r_x1": 175.4,
"r_y1": 453.4,
"r_x2": 175.4,
"r_y2": 444.4,
"r_x3": 119.6,
"r_y3": 444.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 453.5,
"r_x1": 286.4,
"r_y1": 453.5,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 175.4,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 465.4,
"r_x1": 286.4,
"r_y1": 465.4,
"r_x2": 286.4,
"r_y2": 456.5,
"r_x3": 70.0,
"r_y3": 456.5,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 477.4,
"r_x1": 286.4,
"r_y1": 477.4,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 70.0,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 489.3,
"r_x1": 99.6,
"r_y1": 489.3,
"r_x2": 99.6,
"r_y2": 480.4,
"r_x3": 70.0,
"r_y3": 480.4,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 511.1,
"r_x1": 71.6,
"r_y1": 511.1,
"r_x2": 71.6,
"r_y2": 502.2,
"r_x3": 61.6,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.1,
"r_y0": 511.1,
"r_x1": 196.1,
"r_y1": 511.1,
"r_x2": 196.1,
"r_y2": 502.2,
"r_x3": 74.1,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 511.0,
"r_x1": 256.1,
"r_y1": 511.0,
"r_x2": 256.1,
"r_y2": 502.0,
"r_x3": 200.3,
"r_y3": 502.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.4,
"r_y0": 511.1,
"r_x1": 286.4,
"r_y1": 511.1,
"r_x2": 286.4,
"r_y2": 502.2,
"r_x3": 260.4,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 523.0,
"r_x1": 286.4,
"r_y1": 523.0,
"r_x2": 286.4,
"r_y2": 514.1,
"r_x3": 70.0,
"r_y3": 514.1,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.0,
"r_x1": 286.4,
"r_y1": 535.0,
"r_x2": 286.4,
"r_y2": 526.1,
"r_x3": 70.0,
"r_y3": 526.1,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 161.7,
"r_y1": 546.9,
"r_x2": 161.7,
"r_y2": 538.0,
"r_x3": 70.0,
"r_y3": 538.0,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 568.7,
"r_x1": 71.1,
"r_y1": 568.7,
"r_x2": 71.1,
"r_y2": 559.8,
"r_x3": 61.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.7,
"r_x1": 116.7,
"r_y1": 568.7,
"r_x2": 116.7,
"r_y2": 559.8,
"r_x3": 73.5,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.6,
"r_y0": 568.6,
"r_x1": 177.7,
"r_y1": 568.6,
"r_x2": 177.7,
"r_y2": 559.6,
"r_x3": 121.6,
"r_y3": 559.6,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 568.7,
"r_x1": 286.4,
"r_y1": 568.7,
"r_x2": 286.4,
"r_y2": 559.8,
"r_x3": 182.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.6,
"r_x1": 286.4,
"r_y1": 580.6,
"r_x2": 286.4,
"r_y2": 571.7,
"r_x3": 70.0,
"r_y3": 571.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 592.6,
"r_x1": 82.4,
"r_y1": 592.6,
"r_x2": 82.4,
"r_y2": 583.7,
"r_x3": 70.0,
"r_y3": 583.7,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 614.3,
"r_x1": 72.3,
"r_y1": 614.3,
"r_x2": 72.3,
"r_y2": 605.4,
"r_x3": 61.6,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.0,
"r_y0": 614.3,
"r_x1": 286.4,
"r_y1": 614.3,
"r_x2": 286.4,
"r_y2": 605.4,
"r_x3": 75.0,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 626.3,
"r_x1": 286.4,
"r_y1": 626.3,
"r_x2": 286.4,
"r_y2": 617.4,
"r_x3": 70.0,
"r_y3": 617.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 638.2,
"r_x1": 198.1,
"r_y1": 638.2,
"r_x2": 198.1,
"r_y2": 629.3,
"r_x3": 70.0,
"r_y3": 629.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 659.5,
"r_x1": 286.4,
"r_y1": 659.5,
"r_x2": 286.4,
"r_y2": 650.6,
"r_x3": 62.1,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 671.5,
"r_x1": 286.4,
"r_y1": 671.5,
"r_x2": 286.4,
"r_y2": 662.6,
"r_x3": 50.1,
"r_y3": 662.6,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 683.4,
"r_x1": 286.4,
"r_y1": 683.4,
"r_x2": 286.4,
"r_y2": 674.5,
"r_x3": 50.1,
"r_y3": 674.5,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 695.4,
"r_x1": 286.4,
"r_y1": 695.4,
"r_x2": 286.4,
"r_y2": 686.5,
"r_x3": 50.1,
"r_y3": 686.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.0,
"r_y0": 712.7,
"r_x1": 183.7,
"r_y1": 712.7,
"r_x2": 183.7,
"r_y2": 705.6,
"r_x3": 61.0,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 508.1,
"r_y1": 108.0,
"r_x2": 508.1,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 132.5,
"r_x1": 315.6,
"r_y1": 132.5,
"r_x2": 315.6,
"r_y2": 121.7,
"r_x3": 308.9,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.5,
"r_y0": 132.5,
"r_x1": 498.3,
"r_y1": 132.5,
"r_x2": 498.3,
"r_y2": 121.7,
"r_x3": 324.5,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 151.1,
"r_x1": 545.1,
"r_y1": 151.1,
"r_x2": 545.1,
"r_y2": 142.2,
"r_x3": 320.8,
"r_y3": 142.2,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 163.1,
"r_x1": 545.1,
"r_y1": 163.1,
"r_x2": 545.1,
"r_y2": 154.2,
"r_x3": 308.9,
"r_y3": 154.2,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 175.0,
"r_x1": 522.6,
"r_y1": 175.0,
"r_x2": 522.6,
"r_y2": 166.1,
"r_x3": 308.9,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 175.0,
"r_x1": 545.1,
"r_y1": 175.0,
"r_x2": 545.1,
"r_y2": 166.1,
"r_x3": 529.6,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 187.0,
"r_x1": 545.1,
"r_y1": 187.0,
"r_x2": 545.1,
"r_y2": 178.1,
"r_x3": 308.9,
"r_y3": 178.1,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 198.9,
"r_x1": 545.1,
"r_y1": 198.9,
"r_x2": 545.1,
"r_y2": 190.0,
"r_x3": 308.9,
"r_y3": 190.0,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 210.9,
"r_x1": 347.0,
"r_y1": 210.9,
"r_x2": 347.0,
"r_y2": 202.0,
"r_x3": 308.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.9,
"r_y0": 210.9,
"r_x1": 545.1,
"r_y1": 210.9,
"r_x2": 545.1,
"r_y2": 202.0,
"r_x3": 354.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 222.9,
"r_x1": 545.1,
"r_y1": 222.9,
"r_x2": 545.1,
"r_y2": 214.0,
"r_x3": 308.9,
"r_y3": 214.0,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 234.8,
"r_x1": 530.9,
"r_y1": 234.8,
"r_x2": 530.9,
"r_y2": 225.9,
"r_x3": 308.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.9,
"r_y0": 234.8,
"r_x1": 545.1,
"r_y1": 234.8,
"r_x2": 545.1,
"r_y2": 225.9,
"r_x3": 537.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 246.8,
"r_x1": 545.1,
"r_y1": 246.8,
"r_x2": 545.1,
"r_y2": 237.9,
"r_x3": 308.9,
"r_y3": 237.9,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.7,
"r_x1": 545.1,
"r_y1": 258.7,
"r_x2": 545.1,
"r_y2": 249.8,
"r_x3": 308.9,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.7,
"r_x1": 439.8,
"r_y1": 270.7,
"r_x2": 439.8,
"r_y2": 261.8,
"r_x3": 308.9,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.4,
"r_y0": 270.5,
"r_x1": 452.2,
"r_y1": 270.5,
"r_x2": 452.2,
"r_y2": 261.6,
"r_x3": 444.4,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.9,
"r_y0": 270.5,
"r_x1": 470.8,
"r_y1": 270.5,
"r_x2": 470.8,
"r_y2": 261.6,
"r_x3": 455.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.8,
"r_y0": 270.7,
"r_x1": 545.1,
"r_y1": 270.7,
"r_x2": 545.1,
"r_y2": 261.8,
"r_x3": 470.8,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 273.7,
"r_x3": 308.9,
"r_y3": 273.7,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.6,
"r_x1": 545.1,
"r_y1": 294.6,
"r_x2": 545.1,
"r_y2": 285.7,
"r_x3": 308.9,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 306.5,
"r_x1": 545.1,
"r_y1": 306.5,
"r_x2": 545.1,
"r_y2": 297.6,
"r_x3": 308.9,
"r_y3": 297.6,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 318.5,
"r_x1": 545.1,
"r_y1": 318.5,
"r_x2": 545.1,
"r_y2": 309.6,
"r_x3": 308.9,
"r_y3": 309.6,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 330.5,
"r_x1": 425.9,
"r_y1": 330.5,
"r_x2": 425.9,
"r_y2": 321.5,
"r_x3": 308.9,
"r_y3": 321.5,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 342.5,
"r_x1": 545.1,
"r_y1": 342.5,
"r_x2": 545.1,
"r_y2": 333.6,
"r_x3": 320.8,
"r_y3": 333.6,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 354.4,
"r_x1": 545.1,
"r_y1": 354.4,
"r_x2": 545.1,
"r_y2": 345.5,
"r_x3": 308.9,
"r_y3": 345.5,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 366.4,
"r_x1": 545.1,
"r_y1": 366.4,
"r_x2": 545.1,
"r_y2": 357.5,
"r_x3": 308.9,
"r_y3": 357.5,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 378.3,
"r_x1": 545.1,
"r_y1": 378.3,
"r_x2": 545.1,
"r_y2": 369.4,
"r_x3": 308.9,
"r_y3": 369.4,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 390.3,
"r_x1": 545.1,
"r_y1": 390.3,
"r_x2": 545.1,
"r_y2": 381.4,
"r_x3": 308.9,
"r_y3": 381.4,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 402.3,
"r_x1": 545.1,
"r_y1": 402.3,
"r_x2": 545.1,
"r_y2": 393.3,
"r_x3": 308.9,
"r_y3": 393.3,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 414.2,
"r_x1": 545.1,
"r_y1": 414.2,
"r_x2": 545.1,
"r_y2": 405.3,
"r_x3": 308.9,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 426.2,
"r_x1": 545.1,
"r_y1": 426.2,
"r_x2": 545.1,
"r_y2": 417.3,
"r_x3": 308.9,
"r_y3": 417.3,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 438.1,
"r_x1": 545.1,
"r_y1": 438.1,
"r_x2": 545.1,
"r_y2": 429.2,
"r_x3": 308.9,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 450.1,
"r_x1": 401.3,
"r_y1": 450.1,
"r_x2": 401.3,
"r_y2": 441.2,
"r_x3": 308.9,
"r_y3": 441.2,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 462.0,
"r_x1": 423.3,
"r_y1": 462.0,
"r_x2": 423.3,
"r_y2": 453.1,
"r_x3": 320.8,
"r_y3": 453.1,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.3,
"r_y0": 462.1,
"r_x1": 545.1,
"r_y1": 462.1,
"r_x2": 545.1,
"r_y2": 453.2,
"r_x3": 423.3,
"r_y3": 453.2,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 474.0,
"r_x1": 545.1,
"r_y1": 474.0,
"r_x2": 545.1,
"r_y2": 465.1,
"r_x3": 308.9,
"r_y3": 465.1,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.9,
"r_y0": 486.0,
"r_x1": 545.1,
"r_y1": 486.0,
"r_x2": 545.1,
"r_y2": 477.1,
"r_x3": 345.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 498.0,
"r_x1": 545.1,
"r_y1": 498.0,
"r_x2": 545.1,
"r_y2": 489.1,
"r_x3": 308.9,
"r_y3": 489.1,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.9,
"r_x1": 545.1,
"r_y1": 509.9,
"r_x2": 545.1,
"r_y2": 501.0,
"r_x3": 308.9,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.9,
"r_x1": 545.1,
"r_y1": 521.9,
"r_x2": 545.1,
"r_y2": 513.0,
"r_x3": 308.9,
"r_y3": 513.0,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.9,
"r_x3": 308.9,
"r_y3": 524.9,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.8,
"r_x1": 420.9,
"r_y1": 545.8,
"r_x2": 420.9,
"r_y2": 536.9,
"r_x3": 308.9,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.6,
"r_y0": 545.6,
"r_x1": 433.6,
"r_y1": 545.6,
"r_x2": 433.6,
"r_y2": 536.2,
"r_x3": 423.6,
"r_y3": 536.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.2,
"r_y0": 545.8,
"r_x1": 545.1,
"r_y1": 545.8,
"r_x2": 545.1,
"r_y2": 536.9,
"r_x3": 436.2,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.7,
"r_x1": 545.1,
"r_y1": 569.7,
"r_x2": 545.1,
"r_y2": 560.8,
"r_x3": 308.9,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.6,
"r_x1": 545.1,
"r_y1": 593.6,
"r_x2": 545.1,
"r_y2": 584.7,
"r_x3": 308.9,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.6,
"r_x1": 497.1,
"r_y1": 605.6,
"r_x2": 497.1,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.3,
"r_x1": 509.8,
"r_y1": 605.3,
"r_x2": 509.8,
"r_y2": 595.9,
"r_x3": 499.8,
"r_y3": 595.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.6,
"r_x1": 545.1,
"r_y1": 605.6,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 512.5,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.5,
"r_x1": 545.1,
"r_y1": 617.5,
"r_x2": 545.1,
"r_y2": 608.6,
"r_x3": 308.9,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.5,
"r_x1": 545.1,
"r_y1": 629.5,
"r_x2": 545.1,
"r_y2": 620.6,
"r_x3": 308.9,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 364.8,
"r_y1": 641.4,
"r_x2": 364.8,
"r_y2": 632.5,
"r_x3": 308.9,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.6,
"r_y0": 641.2,
"r_x1": 415.6,
"r_y1": 641.2,
"r_x2": 415.6,
"r_y2": 632.6,
"r_x3": 367.6,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.6,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 415.6,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.5,
"r_x3": 308.9,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 376.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.0,
"r_x1": 356.9,
"r_y1": 689.0,
"r_x2": 356.9,
"r_y2": 680.4,
"r_x3": 308.9,
"r_y3": 680.4,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.1,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 357.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 12,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 112.6,
"r_y1": 96.1,
"r_x2": 112.6,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 99.6,
"r": 286.4,
"b": 228.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 108.5,
"r_x1": 286.4,
"r_y1": 108.5,
"r_x2": 286.4,
"r_y2": 99.6,
"r_x3": 62.1,
"r_y3": 99.6,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.4,
"r_x1": 74.7,
"r_y1": 120.4,
"r_x2": 74.7,
"r_y2": 111.5,
"r_x3": 50.1,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 120.4,
"r_x1": 286.4,
"r_y1": 120.4,
"r_x2": 286.4,
"r_y2": 111.5,
"r_x3": 81.3,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.4,
"r_x1": 286.4,
"r_y1": 132.4,
"r_x2": 286.4,
"r_y2": 123.5,
"r_x3": 50.1,
"r_y3": 123.5,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 144.3,
"r_x1": 286.4,
"r_y1": 144.3,
"r_x2": 286.4,
"r_y2": 135.4,
"r_x3": 50.1,
"r_y3": 135.4,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 156.3,
"r_x1": 286.4,
"r_y1": 156.3,
"r_x2": 286.4,
"r_y2": 147.4,
"r_x3": 50.1,
"r_y3": 147.4,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 168.3,
"r_x1": 286.4,
"r_y1": 168.3,
"r_x2": 286.4,
"r_y2": 159.3,
"r_x3": 50.1,
"r_y3": 159.3,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.2,
"r_x1": 286.4,
"r_y1": 180.2,
"r_x2": 286.4,
"r_y2": 171.3,
"r_x3": 50.1,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.2,
"r_x1": 286.4,
"r_y1": 192.2,
"r_x2": 286.4,
"r_y2": 183.3,
"r_x3": 50.1,
"r_y3": 183.3,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.1,
"r_x1": 286.4,
"r_y1": 204.1,
"r_x2": 286.4,
"r_y2": 195.2,
"r_x3": 50.1,
"r_y3": 195.2,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 207.2,
"r_x3": 50.1,
"r_y3": 207.2,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.0,
"r_x1": 278.7,
"r_y1": 228.0,
"r_x2": 278.7,
"r_y2": 219.1,
"r_x3": 50.1,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 231.5,
"r": 286.4,
"b": 371.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 240.4,
"r_x1": 286.4,
"r_y1": 240.4,
"r_x2": 286.4,
"r_y2": 231.5,
"r_x3": 62.1,
"r_y3": 231.5,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 252.4,
"r_x1": 286.4,
"r_y1": 252.4,
"r_x2": 286.4,
"r_y2": 243.5,
"r_x3": 50.1,
"r_y3": 243.5,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.3,
"r_x1": 286.4,
"r_y1": 264.3,
"r_x2": 286.4,
"r_y2": 255.4,
"r_x3": 50.1,
"r_y3": 255.4,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.3,
"r_x1": 286.4,
"r_y1": 276.3,
"r_x2": 286.4,
"r_y2": 267.4,
"r_x3": 50.1,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.3,
"r_x1": 286.4,
"r_y1": 288.3,
"r_x2": 286.4,
"r_y2": 279.4,
"r_x3": 50.1,
"r_y3": 279.4,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.2,
"r_x1": 88.6,
"r_y1": 300.2,
"r_x2": 88.6,
"r_y2": 291.3,
"r_x3": 50.1,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.2,
"r_x1": 286.4,
"r_y1": 300.2,
"r_x2": 286.4,
"r_y2": 291.3,
"r_x3": 95.5,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.2,
"r_x1": 286.4,
"r_y1": 312.2,
"r_x2": 286.4,
"r_y2": 303.3,
"r_x3": 50.1,
"r_y3": 303.3,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.1,
"r_x1": 286.4,
"r_y1": 324.1,
"r_x2": 286.4,
"r_y2": 315.2,
"r_x3": 50.1,
"r_y3": 315.2,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.1,
"r_x1": 286.4,
"r_y1": 336.1,
"r_x2": 286.4,
"r_y2": 327.2,
"r_x3": 50.1,
"r_y3": 327.2,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.0,
"r_x1": 286.4,
"r_y1": 348.0,
"r_x2": 286.4,
"r_y2": 339.1,
"r_x3": 50.1,
"r_y3": 339.1,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.0,
"r_x1": 286.4,
"r_y1": 360.0,
"r_x2": 286.4,
"r_y2": 351.1,
"r_x3": 50.1,
"r_y3": 351.1,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.9,
"r_x1": 77.0,
"r_y1": 371.9,
"r_x2": 77.0,
"r_y2": 363.0,
"r_x3": 50.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 375.4,
"r": 286.4,
"b": 432.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 384.4,
"r_x1": 286.4,
"r_y1": 384.4,
"r_x2": 286.4,
"r_y2": 375.4,
"r_x3": 62.1,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.3,
"r_x1": 121.0,
"r_y1": 396.3,
"r_x2": 121.0,
"r_y2": 387.4,
"r_x3": 50.1,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.2,
"r_x1": 179.7,
"r_y1": 396.2,
"r_x2": 179.7,
"r_y2": 387.3,
"r_x3": 123.9,
"r_y3": 387.3,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 396.3,
"r_x1": 286.4,
"r_y1": 396.3,
"r_x2": 286.4,
"r_y2": 387.4,
"r_x3": 182.6,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.3,
"r_x1": 181.8,
"r_y1": 408.3,
"r_x2": 181.8,
"r_y2": 399.4,
"r_x3": 50.1,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.2,
"r_x1": 240.2,
"r_y1": 408.2,
"r_x2": 240.2,
"r_y2": 399.2,
"r_x3": 184.1,
"r_y3": 399.2,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.3,
"r_x1": 286.4,
"r_y1": 408.3,
"r_x2": 286.4,
"r_y2": 399.4,
"r_x3": 240.2,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.2,
"r_x1": 286.4,
"r_y1": 420.2,
"r_x2": 286.4,
"r_y2": 411.3,
"r_x3": 50.1,
"r_y3": 411.3,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.2,
"r_x1": 82.5,
"r_y1": 432.2,
"r_x2": 82.5,
"r_y2": 423.3,
"r_x3": 50.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 444.4,
"r": 286.4,
"b": 489.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 453.5,
"r_x1": 70.7,
"r_y1": 453.5,
"r_x2": 70.7,
"r_y2": 444.6,
"r_x3": 61.6,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.0,
"r_y0": 453.5,
"r_x1": 117.1,
"r_y1": 453.5,
"r_x2": 117.1,
"r_y2": 444.6,
"r_x3": 73.0,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.6,
"r_y0": 453.4,
"r_x1": 175.4,
"r_y1": 453.4,
"r_x2": 175.4,
"r_y2": 444.4,
"r_x3": 119.6,
"r_y3": 444.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 453.5,
"r_x1": 286.4,
"r_y1": 453.5,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 175.4,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 465.4,
"r_x1": 286.4,
"r_y1": 465.4,
"r_x2": 286.4,
"r_y2": 456.5,
"r_x3": 70.0,
"r_y3": 456.5,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 477.4,
"r_x1": 286.4,
"r_y1": 477.4,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 70.0,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 489.3,
"r_x1": 99.6,
"r_y1": 489.3,
"r_x2": 99.6,
"r_y2": 480.4,
"r_x3": 70.0,
"r_y3": 480.4,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 502.0,
"r": 286.4,
"b": 546.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 511.1,
"r_x1": 71.6,
"r_y1": 511.1,
"r_x2": 71.6,
"r_y2": 502.2,
"r_x3": 61.6,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.1,
"r_y0": 511.1,
"r_x1": 196.1,
"r_y1": 511.1,
"r_x2": 196.1,
"r_y2": 502.2,
"r_x3": 74.1,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 511.0,
"r_x1": 256.1,
"r_y1": 511.0,
"r_x2": 256.1,
"r_y2": 502.0,
"r_x3": 200.3,
"r_y3": 502.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.4,
"r_y0": 511.1,
"r_x1": 286.4,
"r_y1": 511.1,
"r_x2": 286.4,
"r_y2": 502.2,
"r_x3": 260.4,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 523.0,
"r_x1": 286.4,
"r_y1": 523.0,
"r_x2": 286.4,
"r_y2": 514.1,
"r_x3": 70.0,
"r_y3": 514.1,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.0,
"r_x1": 286.4,
"r_y1": 535.0,
"r_x2": 286.4,
"r_y2": 526.1,
"r_x3": 70.0,
"r_y3": 526.1,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 161.7,
"r_y1": 546.9,
"r_x2": 161.7,
"r_y2": 538.0,
"r_x3": 70.0,
"r_y3": 538.0,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 559.6,
"r": 286.4,
"b": 592.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 568.7,
"r_x1": 71.1,
"r_y1": 568.7,
"r_x2": 71.1,
"r_y2": 559.8,
"r_x3": 61.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.7,
"r_x1": 116.7,
"r_y1": 568.7,
"r_x2": 116.7,
"r_y2": 559.8,
"r_x3": 73.5,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.6,
"r_y0": 568.6,
"r_x1": 177.7,
"r_y1": 568.6,
"r_x2": 177.7,
"r_y2": 559.6,
"r_x3": 121.6,
"r_y3": 559.6,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 568.7,
"r_x1": 286.4,
"r_y1": 568.7,
"r_x2": 286.4,
"r_y2": 559.8,
"r_x3": 182.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.6,
"r_x1": 286.4,
"r_y1": 580.6,
"r_x2": 286.4,
"r_y2": 571.7,
"r_x3": 70.0,
"r_y3": 571.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 592.6,
"r_x1": 82.4,
"r_y1": 592.6,
"r_x2": 82.4,
"r_y2": 583.7,
"r_x3": 70.0,
"r_y3": 583.7,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 605.4,
"r": 286.4,
"b": 638.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 614.3,
"r_x1": 72.3,
"r_y1": 614.3,
"r_x2": 72.3,
"r_y2": 605.4,
"r_x3": 61.6,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.0,
"r_y0": 614.3,
"r_x1": 286.4,
"r_y1": 614.3,
"r_x2": 286.4,
"r_y2": 605.4,
"r_x3": 75.0,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 626.3,
"r_x1": 286.4,
"r_y1": 626.3,
"r_x2": 286.4,
"r_y2": 617.4,
"r_x3": 70.0,
"r_y3": 617.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 638.2,
"r_x1": 198.1,
"r_y1": 638.2,
"r_x2": 198.1,
"r_y2": 629.3,
"r_x3": 70.0,
"r_y3": 629.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 650.6,
"r": 286.4,
"b": 695.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 659.5,
"r_x1": 286.4,
"r_y1": 659.5,
"r_x2": 286.4,
"r_y2": 650.6,
"r_x3": 62.1,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 671.5,
"r_x1": 286.4,
"r_y1": 671.5,
"r_x2": 286.4,
"r_y2": 662.6,
"r_x3": 50.1,
"r_y3": 662.6,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 683.4,
"r_x1": 286.4,
"r_y1": 683.4,
"r_x2": 286.4,
"r_y2": 674.5,
"r_x3": 50.1,
"r_y3": 674.5,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 695.4,
"r_x1": 286.4,
"r_y1": 695.4,
"r_x2": 286.4,
"r_y2": 686.5,
"r_x3": 50.1,
"r_y3": 686.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "footnote",
"bbox": {
"l": 61.0,
"t": 705.6,
"r": 183.7,
"b": 712.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.0,
"r_y0": 712.7,
"r_x1": 183.7,
"r_y1": 712.7,
"r_x2": 183.7,
"r_y2": 705.6,
"r_x3": 61.0,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 508.1,
"r_y1": 108.0,
"r_x2": 508.1,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 121.7,
"r": 498.3,
"b": 132.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 132.5,
"r_x1": 315.6,
"r_y1": 132.5,
"r_x2": 315.6,
"r_y2": 121.7,
"r_x3": 308.9,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.5,
"r_y0": 132.5,
"r_x1": 498.3,
"r_y1": 132.5,
"r_x2": 498.3,
"r_y2": 121.7,
"r_x3": 324.5,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 142.2,
"r": 545.1,
"b": 330.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 151.1,
"r_x1": 545.1,
"r_y1": 151.1,
"r_x2": 545.1,
"r_y2": 142.2,
"r_x3": 320.8,
"r_y3": 142.2,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 163.1,
"r_x1": 545.1,
"r_y1": 163.1,
"r_x2": 545.1,
"r_y2": 154.2,
"r_x3": 308.9,
"r_y3": 154.2,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 175.0,
"r_x1": 522.6,
"r_y1": 175.0,
"r_x2": 522.6,
"r_y2": 166.1,
"r_x3": 308.9,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 175.0,
"r_x1": 545.1,
"r_y1": 175.0,
"r_x2": 545.1,
"r_y2": 166.1,
"r_x3": 529.6,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 187.0,
"r_x1": 545.1,
"r_y1": 187.0,
"r_x2": 545.1,
"r_y2": 178.1,
"r_x3": 308.9,
"r_y3": 178.1,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 198.9,
"r_x1": 545.1,
"r_y1": 198.9,
"r_x2": 545.1,
"r_y2": 190.0,
"r_x3": 308.9,
"r_y3": 190.0,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 210.9,
"r_x1": 347.0,
"r_y1": 210.9,
"r_x2": 347.0,
"r_y2": 202.0,
"r_x3": 308.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.9,
"r_y0": 210.9,
"r_x1": 545.1,
"r_y1": 210.9,
"r_x2": 545.1,
"r_y2": 202.0,
"r_x3": 354.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 222.9,
"r_x1": 545.1,
"r_y1": 222.9,
"r_x2": 545.1,
"r_y2": 214.0,
"r_x3": 308.9,
"r_y3": 214.0,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 234.8,
"r_x1": 530.9,
"r_y1": 234.8,
"r_x2": 530.9,
"r_y2": 225.9,
"r_x3": 308.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.9,
"r_y0": 234.8,
"r_x1": 545.1,
"r_y1": 234.8,
"r_x2": 545.1,
"r_y2": 225.9,
"r_x3": 537.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 246.8,
"r_x1": 545.1,
"r_y1": 246.8,
"r_x2": 545.1,
"r_y2": 237.9,
"r_x3": 308.9,
"r_y3": 237.9,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.7,
"r_x1": 545.1,
"r_y1": 258.7,
"r_x2": 545.1,
"r_y2": 249.8,
"r_x3": 308.9,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.7,
"r_x1": 439.8,
"r_y1": 270.7,
"r_x2": 439.8,
"r_y2": 261.8,
"r_x3": 308.9,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.4,
"r_y0": 270.5,
"r_x1": 452.2,
"r_y1": 270.5,
"r_x2": 452.2,
"r_y2": 261.6,
"r_x3": 444.4,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.9,
"r_y0": 270.5,
"r_x1": 470.8,
"r_y1": 270.5,
"r_x2": 470.8,
"r_y2": 261.6,
"r_x3": 455.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.8,
"r_y0": 270.7,
"r_x1": 545.1,
"r_y1": 270.7,
"r_x2": 545.1,
"r_y2": 261.8,
"r_x3": 470.8,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 273.7,
"r_x3": 308.9,
"r_y3": 273.7,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.6,
"r_x1": 545.1,
"r_y1": 294.6,
"r_x2": 545.1,
"r_y2": 285.7,
"r_x3": 308.9,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 306.5,
"r_x1": 545.1,
"r_y1": 306.5,
"r_x2": 545.1,
"r_y2": 297.6,
"r_x3": 308.9,
"r_y3": 297.6,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 318.5,
"r_x1": 545.1,
"r_y1": 318.5,
"r_x2": 545.1,
"r_y2": 309.6,
"r_x3": 308.9,
"r_y3": 309.6,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 330.5,
"r_x1": 425.9,
"r_y1": 330.5,
"r_x2": 425.9,
"r_y2": 321.5,
"r_x3": 308.9,
"r_y3": 321.5,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 333.6,
"r": 545.1,
"b": 450.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 342.5,
"r_x1": 545.1,
"r_y1": 342.5,
"r_x2": 545.1,
"r_y2": 333.6,
"r_x3": 320.8,
"r_y3": 333.6,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 354.4,
"r_x1": 545.1,
"r_y1": 354.4,
"r_x2": 545.1,
"r_y2": 345.5,
"r_x3": 308.9,
"r_y3": 345.5,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 366.4,
"r_x1": 545.1,
"r_y1": 366.4,
"r_x2": 545.1,
"r_y2": 357.5,
"r_x3": 308.9,
"r_y3": 357.5,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 378.3,
"r_x1": 545.1,
"r_y1": 378.3,
"r_x2": 545.1,
"r_y2": 369.4,
"r_x3": 308.9,
"r_y3": 369.4,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 390.3,
"r_x1": 545.1,
"r_y1": 390.3,
"r_x2": 545.1,
"r_y2": 381.4,
"r_x3": 308.9,
"r_y3": 381.4,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 402.3,
"r_x1": 545.1,
"r_y1": 402.3,
"r_x2": 545.1,
"r_y2": 393.3,
"r_x3": 308.9,
"r_y3": 393.3,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 414.2,
"r_x1": 545.1,
"r_y1": 414.2,
"r_x2": 545.1,
"r_y2": 405.3,
"r_x3": 308.9,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 426.2,
"r_x1": 545.1,
"r_y1": 426.2,
"r_x2": 545.1,
"r_y2": 417.3,
"r_x3": 308.9,
"r_y3": 417.3,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 438.1,
"r_x1": 545.1,
"r_y1": 438.1,
"r_x2": 545.1,
"r_y2": 429.2,
"r_x3": 308.9,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 450.1,
"r_x1": 401.3,
"r_y1": 450.1,
"r_x2": 401.3,
"r_y2": 441.2,
"r_x3": 308.9,
"r_y3": 441.2,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 453.1,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 462.0,
"r_x1": 423.3,
"r_y1": 462.0,
"r_x2": 423.3,
"r_y2": 453.1,
"r_x3": 320.8,
"r_y3": 453.1,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.3,
"r_y0": 462.1,
"r_x1": 545.1,
"r_y1": 462.1,
"r_x2": 545.1,
"r_y2": 453.2,
"r_x3": 423.3,
"r_y3": 453.2,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 474.0,
"r_x1": 545.1,
"r_y1": 474.0,
"r_x2": 545.1,
"r_y2": 465.1,
"r_x3": 308.9,
"r_y3": 465.1,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.9,
"r_y0": 486.0,
"r_x1": 545.1,
"r_y1": 486.0,
"r_x2": 545.1,
"r_y2": 477.1,
"r_x3": 345.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 498.0,
"r_x1": 545.1,
"r_y1": 498.0,
"r_x2": 545.1,
"r_y2": 489.1,
"r_x3": 308.9,
"r_y3": 489.1,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.9,
"r_x1": 545.1,
"r_y1": 509.9,
"r_x2": 545.1,
"r_y2": 501.0,
"r_x3": 308.9,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.9,
"r_x1": 545.1,
"r_y1": 521.9,
"r_x2": 545.1,
"r_y2": 513.0,
"r_x3": 308.9,
"r_y3": 513.0,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.9,
"r_x3": 308.9,
"r_y3": 524.9,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.8,
"r_x1": 420.9,
"r_y1": 545.8,
"r_x2": 420.9,
"r_y2": 536.9,
"r_x3": 308.9,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.6,
"r_y0": 545.6,
"r_x1": 433.6,
"r_y1": 545.6,
"r_x2": 433.6,
"r_y2": 536.2,
"r_x3": 423.6,
"r_y3": 536.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.2,
"r_y0": 545.8,
"r_x1": 545.1,
"r_y1": 545.8,
"r_x2": 545.1,
"r_y2": 536.9,
"r_x3": 436.2,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.7,
"r_x1": 545.1,
"r_y1": 569.7,
"r_x2": 545.1,
"r_y2": 560.8,
"r_x3": 308.9,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.6,
"r_x1": 545.1,
"r_y1": 593.6,
"r_x2": 545.1,
"r_y2": 584.7,
"r_x3": 308.9,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.6,
"r_x1": 497.1,
"r_y1": 605.6,
"r_x2": 497.1,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.3,
"r_x1": 509.8,
"r_y1": 605.3,
"r_x2": 509.8,
"r_y2": 595.9,
"r_x3": 499.8,
"r_y3": 595.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.6,
"r_x1": 545.1,
"r_y1": 605.6,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 512.5,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.5,
"r_x1": 545.1,
"r_y1": 617.5,
"r_x2": 545.1,
"r_y2": 608.6,
"r_x3": 308.9,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.5,
"r_x1": 545.1,
"r_y1": 629.5,
"r_x2": 545.1,
"r_y2": 620.6,
"r_x3": 308.9,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 364.8,
"r_y1": 641.4,
"r_x2": 364.8,
"r_y2": 632.5,
"r_x3": 308.9,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.6,
"r_y0": 641.2,
"r_x1": 415.6,
"r_y1": 641.2,
"r_x2": 415.6,
"r_y2": 632.6,
"r_x3": 367.6,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.6,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 415.6,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.5,
"r_x3": 308.9,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 376.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.0,
"r_x1": 356.9,
"r_y1": 689.0,
"r_x2": 356.9,
"r_y2": 680.4,
"r_x3": 308.9,
"r_y3": 680.4,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.1,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 357.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 12,
"page_no": 1,
"cluster": {
"id": 12,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 112.6,
"r_y1": 96.1,
"r_x2": 112.6,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "considered as a solved problem, given enough ground-truth data to train on."
},
{
"label": "text",
"id": 4,
"page_no": 1,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 99.6,
"r": 286.4,
"b": 228.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 108.5,
"r_x1": 286.4,
"r_y1": 108.5,
"r_x2": 286.4,
"r_y2": 99.6,
"r_x3": 62.1,
"r_y3": 99.6,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.4,
"r_x1": 74.7,
"r_y1": 120.4,
"r_x2": 74.7,
"r_y2": 111.5,
"r_x3": 50.1,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 120.4,
"r_x1": 286.4,
"r_y1": 120.4,
"r_x2": 286.4,
"r_y2": 111.5,
"r_x3": 81.3,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.4,
"r_x1": 286.4,
"r_y1": 132.4,
"r_x2": 286.4,
"r_y2": 123.5,
"r_x3": 50.1,
"r_y3": 123.5,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 144.3,
"r_x1": 286.4,
"r_y1": 144.3,
"r_x2": 286.4,
"r_y2": 135.4,
"r_x3": 50.1,
"r_y3": 135.4,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 156.3,
"r_x1": 286.4,
"r_y1": 156.3,
"r_x2": 286.4,
"r_y2": 147.4,
"r_x3": 50.1,
"r_y3": 147.4,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 168.3,
"r_x1": 286.4,
"r_y1": 168.3,
"r_x2": 286.4,
"r_y2": 159.3,
"r_x3": 50.1,
"r_y3": 159.3,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.2,
"r_x1": 286.4,
"r_y1": 180.2,
"r_x2": 286.4,
"r_y2": 171.3,
"r_x3": 50.1,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.2,
"r_x1": 286.4,
"r_y1": 192.2,
"r_x2": 286.4,
"r_y2": 183.3,
"r_x3": 50.1,
"r_y3": 183.3,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.1,
"r_x1": 286.4,
"r_y1": 204.1,
"r_x2": 286.4,
"r_y2": 195.2,
"r_x3": 50.1,
"r_y3": 195.2,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 207.2,
"r_x3": 50.1,
"r_y3": 207.2,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.0,
"r_x1": 278.7,
"r_y1": 228.0,
"r_x2": 278.7,
"r_y2": 219.1,
"r_x3": 50.1,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."
},
{
"label": "text",
"id": 2,
"page_no": 1,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 231.5,
"r": 286.4,
"b": 371.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 240.4,
"r_x1": 286.4,
"r_y1": 240.4,
"r_x2": 286.4,
"r_y2": 231.5,
"r_x3": 62.1,
"r_y3": 231.5,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 252.4,
"r_x1": 286.4,
"r_y1": 252.4,
"r_x2": 286.4,
"r_y2": 243.5,
"r_x3": 50.1,
"r_y3": 243.5,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.3,
"r_x1": 286.4,
"r_y1": 264.3,
"r_x2": 286.4,
"r_y2": 255.4,
"r_x3": 50.1,
"r_y3": 255.4,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.3,
"r_x1": 286.4,
"r_y1": 276.3,
"r_x2": 286.4,
"r_y2": 267.4,
"r_x3": 50.1,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.3,
"r_x1": 286.4,
"r_y1": 288.3,
"r_x2": 286.4,
"r_y2": 279.4,
"r_x3": 50.1,
"r_y3": 279.4,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.2,
"r_x1": 88.6,
"r_y1": 300.2,
"r_x2": 88.6,
"r_y2": 291.3,
"r_x3": 50.1,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.2,
"r_x1": 286.4,
"r_y1": 300.2,
"r_x2": 286.4,
"r_y2": 291.3,
"r_x3": 95.5,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.2,
"r_x1": 286.4,
"r_y1": 312.2,
"r_x2": 286.4,
"r_y2": 303.3,
"r_x3": 50.1,
"r_y3": 303.3,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.1,
"r_x1": 286.4,
"r_y1": 324.1,
"r_x2": 286.4,
"r_y2": 315.2,
"r_x3": 50.1,
"r_y3": 315.2,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.1,
"r_x1": 286.4,
"r_y1": 336.1,
"r_x2": 286.4,
"r_y2": 327.2,
"r_x3": 50.1,
"r_y3": 327.2,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.0,
"r_x1": 286.4,
"r_y1": 348.0,
"r_x2": 286.4,
"r_y2": 339.1,
"r_x3": 50.1,
"r_y3": 339.1,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.0,
"r_x1": 286.4,
"r_y1": 360.0,
"r_x2": 286.4,
"r_y2": 351.1,
"r_x3": 50.1,
"r_y3": 351.1,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.9,
"r_x1": 77.0,
"r_y1": 371.9,
"r_x2": 77.0,
"r_y2": 363.0,
"r_x3": 50.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."
},
{
"label": "text",
"id": 7,
"page_no": 1,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 375.4,
"r": 286.4,
"b": 432.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 384.4,
"r_x1": 286.4,
"r_y1": 384.4,
"r_x2": 286.4,
"r_y2": 375.4,
"r_x3": 62.1,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.3,
"r_x1": 121.0,
"r_y1": 396.3,
"r_x2": 121.0,
"r_y2": 387.4,
"r_x3": 50.1,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.2,
"r_x1": 179.7,
"r_y1": 396.2,
"r_x2": 179.7,
"r_y2": 387.3,
"r_x3": 123.9,
"r_y3": 387.3,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 396.3,
"r_x1": 286.4,
"r_y1": 396.3,
"r_x2": 286.4,
"r_y2": 387.4,
"r_x3": 182.6,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.3,
"r_x1": 181.8,
"r_y1": 408.3,
"r_x2": 181.8,
"r_y2": 399.4,
"r_x3": 50.1,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.2,
"r_x1": 240.2,
"r_y1": 408.2,
"r_x2": 240.2,
"r_y2": 399.2,
"r_x3": 184.1,
"r_y3": 399.2,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.3,
"r_x1": 286.4,
"r_y1": 408.3,
"r_x2": 286.4,
"r_y2": 399.4,
"r_x3": 240.2,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.2,
"r_x1": 286.4,
"r_y1": 420.2,
"r_x2": 286.4,
"r_y2": 411.3,
"r_x3": 50.1,
"r_y3": 411.3,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.2,
"r_x1": 82.5,
"r_y1": 432.2,
"r_x2": 82.5,
"r_y2": 423.3,
"r_x3": 50.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:"
},
{
"label": "list_item",
"id": 6,
"page_no": 1,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 444.4,
"r": 286.4,
"b": 489.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 453.5,
"r_x1": 70.7,
"r_y1": 453.5,
"r_x2": 70.7,
"r_y2": 444.6,
"r_x3": 61.6,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.0,
"r_y0": 453.5,
"r_x1": 117.1,
"r_y1": 453.5,
"r_x2": 117.1,
"r_y2": 444.6,
"r_x3": 73.0,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.6,
"r_y0": 453.4,
"r_x1": 175.4,
"r_y1": 453.4,
"r_x2": 175.4,
"r_y2": 444.4,
"r_x3": 119.6,
"r_y3": 444.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 453.5,
"r_x1": 286.4,
"r_y1": 453.5,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 175.4,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 465.4,
"r_x1": 286.4,
"r_y1": 465.4,
"r_x2": 286.4,
"r_y2": 456.5,
"r_x3": 70.0,
"r_y3": 456.5,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 477.4,
"r_x1": 286.4,
"r_y1": 477.4,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 70.0,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 489.3,
"r_x1": 99.6,
"r_y1": 489.3,
"r_x2": 99.6,
"r_y2": 480.4,
"r_x3": 70.0,
"r_y3": 480.4,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."
},
{
"label": "list_item",
"id": 5,
"page_no": 1,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 502.0,
"r": 286.4,
"b": 546.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 511.1,
"r_x1": 71.6,
"r_y1": 511.1,
"r_x2": 71.6,
"r_y2": 502.2,
"r_x3": 61.6,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.1,
"r_y0": 511.1,
"r_x1": 196.1,
"r_y1": 511.1,
"r_x2": 196.1,
"r_y2": 502.2,
"r_x3": 74.1,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 511.0,
"r_x1": 256.1,
"r_y1": 511.0,
"r_x2": 256.1,
"r_y2": 502.0,
"r_x3": 200.3,
"r_y3": 502.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.4,
"r_y0": 511.1,
"r_x1": 286.4,
"r_y1": 511.1,
"r_x2": 286.4,
"r_y2": 502.2,
"r_x3": 260.4,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 523.0,
"r_x1": 286.4,
"r_y1": 523.0,
"r_x2": 286.4,
"r_y2": 514.1,
"r_x3": 70.0,
"r_y3": 514.1,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.0,
"r_x1": 286.4,
"r_y1": 535.0,
"r_x2": 286.4,
"r_y2": 526.1,
"r_x3": 70.0,
"r_y3": 526.1,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 161.7,
"r_y1": 546.9,
"r_x2": 161.7,
"r_y2": 538.0,
"r_x3": 70.0,
"r_y3": 538.0,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."
},
{
"label": "list_item",
"id": 9,
"page_no": 1,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 559.6,
"r": 286.4,
"b": 592.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 568.7,
"r_x1": 71.1,
"r_y1": 568.7,
"r_x2": 71.1,
"r_y2": 559.8,
"r_x3": 61.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.7,
"r_x1": 116.7,
"r_y1": 568.7,
"r_x2": 116.7,
"r_y2": 559.8,
"r_x3": 73.5,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.6,
"r_y0": 568.6,
"r_x1": 177.7,
"r_y1": 568.6,
"r_x2": 177.7,
"r_y2": 559.6,
"r_x3": 121.6,
"r_y3": 559.6,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 568.7,
"r_x1": 286.4,
"r_y1": 568.7,
"r_x2": 286.4,
"r_y2": 559.8,
"r_x3": 182.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.6,
"r_x1": 286.4,
"r_y1": 580.6,
"r_x2": 286.4,
"r_y2": 571.7,
"r_x3": 70.0,
"r_y3": 571.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 592.6,
"r_x1": 82.4,
"r_y1": 592.6,
"r_x2": 82.4,
"r_y2": 583.7,
"r_x3": 70.0,
"r_y3": 583.7,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."
},
{
"label": "list_item",
"id": 8,
"page_no": 1,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 605.4,
"r": 286.4,
"b": 638.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 614.3,
"r_x1": 72.3,
"r_y1": 614.3,
"r_x2": 72.3,
"r_y2": 605.4,
"r_x3": 61.6,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.0,
"r_y0": 614.3,
"r_x1": 286.4,
"r_y1": 614.3,
"r_x2": 286.4,
"r_y2": 605.4,
"r_x3": 75.0,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 626.3,
"r_x1": 286.4,
"r_y1": 626.3,
"r_x2": 286.4,
"r_y2": 617.4,
"r_x3": 70.0,
"r_y3": 617.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 638.2,
"r_x1": 198.1,
"r_y1": 638.2,
"r_x2": 198.1,
"r_y2": 629.3,
"r_x3": 70.0,
"r_y3": 629.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."
},
{
"label": "text",
"id": 11,
"page_no": 1,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 650.6,
"r": 286.4,
"b": 695.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 659.5,
"r_x1": 286.4,
"r_y1": 659.5,
"r_x2": 286.4,
"r_y2": 650.6,
"r_x3": 62.1,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 671.5,
"r_x1": 286.4,
"r_y1": 671.5,
"r_x2": 286.4,
"r_y2": 662.6,
"r_x3": 50.1,
"r_y3": 662.6,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 683.4,
"r_x1": 286.4,
"r_y1": 683.4,
"r_x2": 286.4,
"r_y2": 674.5,
"r_x3": 50.1,
"r_y3": 674.5,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 695.4,
"r_x1": 286.4,
"r_y1": 695.4,
"r_x2": 286.4,
"r_y2": 686.5,
"r_x3": 50.1,
"r_y3": 686.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"
},
{
"label": "footnote",
"id": 14,
"page_no": 1,
"cluster": {
"id": 14,
"label": "footnote",
"bbox": {
"l": 61.0,
"t": 705.6,
"r": 183.7,
"b": 712.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.0,
"r_y0": 712.7,
"r_x1": 183.7,
"r_y1": 712.7,
"r_x2": 183.7,
"r_y2": 705.6,
"r_x3": 61.0,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet"
},
{
"label": "text",
"id": 10,
"page_no": 1,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 508.1,
"r_y1": 108.0,
"r_x2": 508.1,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."
},
{
"label": "section_header",
"id": 13,
"page_no": 1,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 121.7,
"r": 498.3,
"b": 132.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 132.5,
"r_x1": 315.6,
"r_y1": 132.5,
"r_x2": 315.6,
"r_y2": 121.7,
"r_x3": 308.9,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.5,
"r_y0": 132.5,
"r_x1": 498.3,
"r_y1": 132.5,
"r_x2": 498.3,
"r_y2": 121.7,
"r_x3": 324.5,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Previous work and State of the Art"
},
{
"label": "text",
"id": 0,
"page_no": 1,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 142.2,
"r": 545.1,
"b": 330.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 151.1,
"r_x1": 545.1,
"r_y1": 151.1,
"r_x2": 545.1,
"r_y2": 142.2,
"r_x3": 320.8,
"r_y3": 142.2,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 163.1,
"r_x1": 545.1,
"r_y1": 163.1,
"r_x2": 545.1,
"r_y2": 154.2,
"r_x3": 308.9,
"r_y3": 154.2,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 175.0,
"r_x1": 522.6,
"r_y1": 175.0,
"r_x2": 522.6,
"r_y2": 166.1,
"r_x3": 308.9,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 175.0,
"r_x1": 545.1,
"r_y1": 175.0,
"r_x2": 545.1,
"r_y2": 166.1,
"r_x3": 529.6,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 187.0,
"r_x1": 545.1,
"r_y1": 187.0,
"r_x2": 545.1,
"r_y2": 178.1,
"r_x3": 308.9,
"r_y3": 178.1,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 198.9,
"r_x1": 545.1,
"r_y1": 198.9,
"r_x2": 545.1,
"r_y2": 190.0,
"r_x3": 308.9,
"r_y3": 190.0,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 210.9,
"r_x1": 347.0,
"r_y1": 210.9,
"r_x2": 347.0,
"r_y2": 202.0,
"r_x3": 308.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.9,
"r_y0": 210.9,
"r_x1": 545.1,
"r_y1": 210.9,
"r_x2": 545.1,
"r_y2": 202.0,
"r_x3": 354.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 222.9,
"r_x1": 545.1,
"r_y1": 222.9,
"r_x2": 545.1,
"r_y2": 214.0,
"r_x3": 308.9,
"r_y3": 214.0,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 234.8,
"r_x1": 530.9,
"r_y1": 234.8,
"r_x2": 530.9,
"r_y2": 225.9,
"r_x3": 308.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.9,
"r_y0": 234.8,
"r_x1": 545.1,
"r_y1": 234.8,
"r_x2": 545.1,
"r_y2": 225.9,
"r_x3": 537.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 246.8,
"r_x1": 545.1,
"r_y1": 246.8,
"r_x2": 545.1,
"r_y2": 237.9,
"r_x3": 308.9,
"r_y3": 237.9,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.7,
"r_x1": 545.1,
"r_y1": 258.7,
"r_x2": 545.1,
"r_y2": 249.8,
"r_x3": 308.9,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.7,
"r_x1": 439.8,
"r_y1": 270.7,
"r_x2": 439.8,
"r_y2": 261.8,
"r_x3": 308.9,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.4,
"r_y0": 270.5,
"r_x1": 452.2,
"r_y1": 270.5,
"r_x2": 452.2,
"r_y2": 261.6,
"r_x3": 444.4,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.9,
"r_y0": 270.5,
"r_x1": 470.8,
"r_y1": 270.5,
"r_x2": 470.8,
"r_y2": 261.6,
"r_x3": 455.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.8,
"r_y0": 270.7,
"r_x1": 545.1,
"r_y1": 270.7,
"r_x2": 545.1,
"r_y2": 261.8,
"r_x3": 470.8,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 273.7,
"r_x3": 308.9,
"r_y3": 273.7,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.6,
"r_x1": 545.1,
"r_y1": 294.6,
"r_x2": 545.1,
"r_y2": 285.7,
"r_x3": 308.9,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 306.5,
"r_x1": 545.1,
"r_y1": 306.5,
"r_x2": 545.1,
"r_y2": 297.6,
"r_x3": 308.9,
"r_y3": 297.6,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 318.5,
"r_x1": 545.1,
"r_y1": 318.5,
"r_x2": 545.1,
"r_y2": 309.6,
"r_x3": 308.9,
"r_y3": 309.6,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 330.5,
"r_x1": 425.9,
"r_y1": 330.5,
"r_x2": 425.9,
"r_y2": 321.5,
"r_x3": 308.9,
"r_y3": 321.5,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."
},
{
"label": "text",
"id": 1,
"page_no": 1,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 333.6,
"r": 545.1,
"b": 450.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 342.5,
"r_x1": 545.1,
"r_y1": 342.5,
"r_x2": 545.1,
"r_y2": 333.6,
"r_x3": 320.8,
"r_y3": 333.6,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 354.4,
"r_x1": 545.1,
"r_y1": 354.4,
"r_x2": 545.1,
"r_y2": 345.5,
"r_x3": 308.9,
"r_y3": 345.5,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 366.4,
"r_x1": 545.1,
"r_y1": 366.4,
"r_x2": 545.1,
"r_y2": 357.5,
"r_x3": 308.9,
"r_y3": 357.5,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 378.3,
"r_x1": 545.1,
"r_y1": 378.3,
"r_x2": 545.1,
"r_y2": 369.4,
"r_x3": 308.9,
"r_y3": 369.4,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 390.3,
"r_x1": 545.1,
"r_y1": 390.3,
"r_x2": 545.1,
"r_y2": 381.4,
"r_x3": 308.9,
"r_y3": 381.4,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 402.3,
"r_x1": 545.1,
"r_y1": 402.3,
"r_x2": 545.1,
"r_y2": 393.3,
"r_x3": 308.9,
"r_y3": 393.3,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 414.2,
"r_x1": 545.1,
"r_y1": 414.2,
"r_x2": 545.1,
"r_y2": 405.3,
"r_x3": 308.9,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 426.2,
"r_x1": 545.1,
"r_y1": 426.2,
"r_x2": 545.1,
"r_y2": 417.3,
"r_x3": 308.9,
"r_y3": 417.3,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 438.1,
"r_x1": 545.1,
"r_y1": 438.1,
"r_x2": 545.1,
"r_y2": 429.2,
"r_x3": 308.9,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 450.1,
"r_x1": 401.3,
"r_y1": 450.1,
"r_x2": 401.3,
"r_y2": 441.2,
"r_x3": 308.9,
"r_y3": 441.2,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification."
},
{
"label": "text",
"id": 3,
"page_no": 1,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 453.1,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 462.0,
"r_x1": 423.3,
"r_y1": 462.0,
"r_x2": 423.3,
"r_y2": 453.1,
"r_x3": 320.8,
"r_y3": 453.1,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.3,
"r_y0": 462.1,
"r_x1": 545.1,
"r_y1": 462.1,
"r_x2": 545.1,
"r_y2": 453.2,
"r_x3": 423.3,
"r_y3": 453.2,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 474.0,
"r_x1": 545.1,
"r_y1": 474.0,
"r_x2": 545.1,
"r_y2": 465.1,
"r_x3": 308.9,
"r_y3": 465.1,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.9,
"r_y0": 486.0,
"r_x1": 545.1,
"r_y1": 486.0,
"r_x2": 545.1,
"r_y2": 477.1,
"r_x3": 345.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 498.0,
"r_x1": 545.1,
"r_y1": 498.0,
"r_x2": 545.1,
"r_y2": 489.1,
"r_x3": 308.9,
"r_y3": 489.1,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.9,
"r_x1": 545.1,
"r_y1": 509.9,
"r_x2": 545.1,
"r_y2": 501.0,
"r_x3": 308.9,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.9,
"r_x1": 545.1,
"r_y1": 521.9,
"r_x2": 545.1,
"r_y2": 513.0,
"r_x3": 308.9,
"r_y3": 513.0,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.9,
"r_x3": 308.9,
"r_y3": 524.9,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.8,
"r_x1": 420.9,
"r_y1": 545.8,
"r_x2": 420.9,
"r_y2": 536.9,
"r_x3": 308.9,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.6,
"r_y0": 545.6,
"r_x1": 433.6,
"r_y1": 545.6,
"r_x2": 433.6,
"r_y2": 536.2,
"r_x3": 423.6,
"r_y3": 536.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.2,
"r_y0": 545.8,
"r_x1": 545.1,
"r_y1": 545.8,
"r_x2": 545.1,
"r_y2": 536.9,
"r_x3": 436.2,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.7,
"r_x1": 545.1,
"r_y1": 569.7,
"r_x2": 545.1,
"r_y2": 560.8,
"r_x3": 308.9,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.6,
"r_x1": 545.1,
"r_y1": 593.6,
"r_x2": 545.1,
"r_y2": 584.7,
"r_x3": 308.9,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.6,
"r_x1": 497.1,
"r_y1": 605.6,
"r_x2": 497.1,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.3,
"r_x1": 509.8,
"r_y1": 605.3,
"r_x2": 509.8,
"r_y2": 595.9,
"r_x3": 499.8,
"r_y3": 595.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.6,
"r_x1": 545.1,
"r_y1": 605.6,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 512.5,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.5,
"r_x1": 545.1,
"r_y1": 617.5,
"r_x2": 545.1,
"r_y2": 608.6,
"r_x3": 308.9,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.5,
"r_x1": 545.1,
"r_y1": 629.5,
"r_x2": 545.1,
"r_y2": 620.6,
"r_x3": 308.9,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 364.8,
"r_y1": 641.4,
"r_x2": 364.8,
"r_y2": 632.5,
"r_x3": 308.9,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.6,
"r_y0": 641.2,
"r_x1": 415.6,
"r_y1": 641.2,
"r_x2": 415.6,
"r_y2": 632.6,
"r_x3": 367.6,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.6,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 415.6,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.5,
"r_x3": 308.9,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 376.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.0,
"r_x1": 356.9,
"r_y1": 689.0,
"r_x2": 356.9,
"r_y2": 680.4,
"r_x3": 308.9,
"r_y3": 680.4,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.1,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 357.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"
},
{
"label": "page_footer",
"id": 15,
"page_no": 1,
"cluster": {
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2"
}
],
"body": [
{
"label": "text",
"id": 12,
"page_no": 1,
"cluster": {
"id": 12,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "considered as a solved problem, given enough ground-truth",
"orig": "considered as a solved problem, given enough ground-truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 112.6,
"r_y1": 96.1,
"r_x2": 112.6,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "data to train on.",
"orig": "data to train on.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "considered as a solved problem, given enough ground-truth data to train on."
},
{
"label": "text",
"id": 4,
"page_no": 1,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 99.6,
"r": 286.4,
"b": 228.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 108.5,
"r_x1": 286.4,
"r_y1": 108.5,
"r_x2": 286.4,
"r_y2": 99.6,
"r_x3": 62.1,
"r_y3": 99.6,
"coord_origin": "TOPLEFT"
},
"text": "The second problem is called table-structure decompo-",
"orig": "The second problem is called table-structure decompo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.4,
"r_x1": 74.7,
"r_y1": 120.4,
"r_x2": 74.7,
"r_y2": 111.5,
"r_x3": 50.1,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "sition.",
"orig": "sition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 120.4,
"r_x1": 286.4,
"r_y1": 120.4,
"r_x2": 286.4,
"r_y2": 111.5,
"r_x3": 81.3,
"r_y3": 111.5,
"coord_origin": "TOPLEFT"
},
"text": "The latter is a long standing problem in the com-",
"orig": "The latter is a long standing problem in the com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.4,
"r_x1": 286.4,
"r_y1": 132.4,
"r_x2": 286.4,
"r_y2": 123.5,
"r_x3": 50.1,
"r_y3": 123.5,
"coord_origin": "TOPLEFT"
},
"text": "munity of document understanding [6, 4, 14]. Contrary to",
"orig": "munity of document understanding [6, 4, 14]. Contrary to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 144.3,
"r_x1": 286.4,
"r_y1": 144.3,
"r_x2": 286.4,
"r_y2": 135.4,
"r_x3": 50.1,
"r_y3": 135.4,
"coord_origin": "TOPLEFT"
},
"text": "the table-location problem, there are no commonly used ap-",
"orig": "the table-location problem, there are no commonly used ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 156.3,
"r_x1": 286.4,
"r_y1": 156.3,
"r_x2": 286.4,
"r_y2": 147.4,
"r_x3": 50.1,
"r_y3": 147.4,
"coord_origin": "TOPLEFT"
},
"text": "proaches that can easily be re-purposed to solve this prob-",
"orig": "proaches that can easily be re-purposed to solve this prob-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 168.3,
"r_x1": 286.4,
"r_y1": 168.3,
"r_x2": 286.4,
"r_y2": 159.3,
"r_x3": 50.1,
"r_y3": 159.3,
"coord_origin": "TOPLEFT"
},
"text": "lem. Lately, a set of new model-architectures has been pro-",
"orig": "lem. Lately, a set of new model-architectures has been pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.2,
"r_x1": 286.4,
"r_y1": 180.2,
"r_x2": 286.4,
"r_y2": 171.3,
"r_x3": 50.1,
"r_y3": 171.3,
"coord_origin": "TOPLEFT"
},
"text": "posed by the community to address table-structure decom-",
"orig": "posed by the community to address table-structure decom-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.2,
"r_x1": 286.4,
"r_y1": 192.2,
"r_x2": 286.4,
"r_y2": 183.3,
"r_x3": 50.1,
"r_y3": 183.3,
"coord_origin": "TOPLEFT"
},
"text": "position [37, 36, 18, 20]. All these models have some weak-",
"orig": "position [37, 36, 18, 20]. All these models have some weak-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.1,
"r_x1": 286.4,
"r_y1": 204.1,
"r_x2": 286.4,
"r_y2": 195.2,
"r_x3": 50.1,
"r_y3": 195.2,
"coord_origin": "TOPLEFT"
},
"text": "nesses (see Sec. 2). The common denominator here is the",
"orig": "nesses (see Sec. 2). The common denominator here is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 207.2,
"r_x3": 50.1,
"r_y3": 207.2,
"coord_origin": "TOPLEFT"
},
"text": "reliance on textual features and/or the inability to provide",
"orig": "reliance on textual features and/or the inability to provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.0,
"r_x1": 278.7,
"r_y1": 228.0,
"r_x2": 278.7,
"r_y2": 219.1,
"r_x3": 50.1,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table-cell in the original image.",
"orig": "the bounding box of each table-cell in the original image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."
},
{
"label": "text",
"id": 2,
"page_no": 1,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 231.5,
"r": 286.4,
"b": 371.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 240.4,
"r_x1": 286.4,
"r_y1": 240.4,
"r_x2": 286.4,
"r_y2": 231.5,
"r_x3": 62.1,
"r_y3": 231.5,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we want to address these weaknesses and",
"orig": "In this paper, we want to address these weaknesses and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 252.4,
"r_x1": 286.4,
"r_y1": 252.4,
"r_x2": 286.4,
"r_y2": 243.5,
"r_x3": 50.1,
"r_y3": 243.5,
"coord_origin": "TOPLEFT"
},
"text": "present a robust table-structure decomposition algorithm.",
"orig": "present a robust table-structure decomposition algorithm.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.3,
"r_x1": 286.4,
"r_y1": 264.3,
"r_x2": 286.4,
"r_y2": 255.4,
"r_x3": 50.1,
"r_y3": 255.4,
"coord_origin": "TOPLEFT"
},
"text": "The design criteria for our model are the following. First,",
"orig": "The design criteria for our model are the following. First,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.3,
"r_x1": 286.4,
"r_y1": 276.3,
"r_x2": 286.4,
"r_y2": 267.4,
"r_x3": 50.1,
"r_y3": 267.4,
"coord_origin": "TOPLEFT"
},
"text": "we want our algorithm to be language agnostic. In this way,",
"orig": "we want our algorithm to be language agnostic. In this way,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.3,
"r_x1": 286.4,
"r_y1": 288.3,
"r_x2": 286.4,
"r_y2": 279.4,
"r_x3": 50.1,
"r_y3": 279.4,
"coord_origin": "TOPLEFT"
},
"text": "we can obtain the structure of any table, irregardless of the",
"orig": "we can obtain the structure of any table, irregardless of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.2,
"r_x1": 88.6,
"r_y1": 300.2,
"r_x2": 88.6,
"r_y2": 291.3,
"r_x3": 50.1,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "language.",
"orig": "language.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 95.5,
"r_y0": 300.2,
"r_x1": 286.4,
"r_y1": 300.2,
"r_x2": 286.4,
"r_y2": 291.3,
"r_x3": 95.5,
"r_y3": 291.3,
"coord_origin": "TOPLEFT"
},
"text": "Second, we want our algorithm to leverage as",
"orig": "Second, we want our algorithm to leverage as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.2,
"r_x1": 286.4,
"r_y1": 312.2,
"r_x2": 286.4,
"r_y2": 303.3,
"r_x3": 50.1,
"r_y3": 303.3,
"coord_origin": "TOPLEFT"
},
"text": "much data as possible from the original PDF document. For",
"orig": "much data as possible from the original PDF document. For",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.1,
"r_x1": 286.4,
"r_y1": 324.1,
"r_x2": 286.4,
"r_y2": 315.2,
"r_x3": 50.1,
"r_y3": 315.2,
"coord_origin": "TOPLEFT"
},
"text": "programmatic PDF documents, the text-cells can often be",
"orig": "programmatic PDF documents, the text-cells can often be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.1,
"r_x1": 286.4,
"r_y1": 336.1,
"r_x2": 286.4,
"r_y2": 327.2,
"r_x3": 50.1,
"r_y3": 327.2,
"coord_origin": "TOPLEFT"
},
"text": "extracted much faster and with higher accuracy compared",
"orig": "extracted much faster and with higher accuracy compared",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.0,
"r_x1": 286.4,
"r_y1": 348.0,
"r_x2": 286.4,
"r_y2": 339.1,
"r_x3": 50.1,
"r_y3": 339.1,
"coord_origin": "TOPLEFT"
},
"text": "to OCR methods. Last but not least, we want to have a di-",
"orig": "to OCR methods. Last but not least, we want to have a di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.0,
"r_x1": 286.4,
"r_y1": 360.0,
"r_x2": 286.4,
"r_y2": 351.1,
"r_x3": 50.1,
"r_y3": 351.1,
"coord_origin": "TOPLEFT"
},
"text": "rect link between the table-cell and its bounding box in the",
"orig": "rect link between the table-cell and its bounding box in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.9,
"r_x1": 77.0,
"r_y1": 371.9,
"r_x2": 77.0,
"r_y2": 363.0,
"r_x3": 50.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."
},
{
"label": "text",
"id": 7,
"page_no": 1,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 375.4,
"r": 286.4,
"b": 432.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 384.4,
"r_x1": 286.4,
"r_y1": 384.4,
"r_x2": 286.4,
"r_y2": 375.4,
"r_x3": 62.1,
"r_y3": 375.4,
"coord_origin": "TOPLEFT"
},
"text": "To meet the design criteria listed above, we developed a",
"orig": "To meet the design criteria listed above, we developed a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.3,
"r_x1": 121.0,
"r_y1": 396.3,
"r_x2": 121.0,
"r_y2": 387.4,
"r_x3": 50.1,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "new model called",
"orig": "new model called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 123.9,
"r_y0": 396.2,
"r_x1": 179.7,
"r_y1": 396.2,
"r_x2": 179.7,
"r_y2": 387.3,
"r_x3": 123.9,
"r_y3": 387.3,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 396.3,
"r_x1": 286.4,
"r_y1": 396.3,
"r_x2": 286.4,
"r_y2": 387.4,
"r_x3": 182.6,
"r_y3": 387.4,
"coord_origin": "TOPLEFT"
},
"text": "and a synthetically gener-",
"orig": "and a synthetically gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.3,
"r_x1": 181.8,
"r_y1": 408.3,
"r_x2": 181.8,
"r_y2": 399.4,
"r_x3": 50.1,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "ated table structure dataset called",
"orig": "ated table structure dataset called",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.1,
"r_y0": 408.2,
"r_x1": 240.2,
"r_y1": 408.2,
"r_x2": 240.2,
"r_y2": 399.2,
"r_x3": 184.1,
"r_y3": 399.2,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.2,
"r_y0": 408.3,
"r_x1": 286.4,
"r_y1": 408.3,
"r_x2": 286.4,
"r_y2": 399.4,
"r_x3": 240.2,
"r_y3": 399.4,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$. In partic-",
"orig": "$^{1}$. In partic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.2,
"r_x1": 286.4,
"r_y1": 420.2,
"r_x2": 286.4,
"r_y2": 411.3,
"r_x3": 50.1,
"r_y3": 411.3,
"coord_origin": "TOPLEFT"
},
"text": "ular, our contributions in this work can be summarised as",
"orig": "ular, our contributions in this work can be summarised as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.2,
"r_x1": 82.5,
"r_y1": 432.2,
"r_x2": 82.5,
"r_y2": 423.3,
"r_x3": 50.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "follows:",
"orig": "follows:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet $^{1}$. In particular, our contributions in this work can be summarised as follows:"
},
{
"label": "list_item",
"id": 6,
"page_no": 1,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 444.4,
"r": 286.4,
"b": 489.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 453.5,
"r_x1": 70.7,
"r_y1": 453.5,
"r_x2": 70.7,
"r_y2": 444.6,
"r_x3": 61.6,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.0,
"r_y0": 453.5,
"r_x1": 117.1,
"r_y1": 453.5,
"r_x2": 117.1,
"r_y2": 444.6,
"r_x3": 73.0,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": "We propose",
"orig": "We propose",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.6,
"r_y0": 453.4,
"r_x1": 175.4,
"r_y1": 453.4,
"r_x2": 175.4,
"r_y2": 444.4,
"r_x3": 119.6,
"r_y3": 444.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 453.5,
"r_x1": 286.4,
"r_y1": 453.5,
"r_x2": 286.4,
"r_y2": 444.6,
"r_x3": 175.4,
"r_y3": 444.6,
"coord_origin": "TOPLEFT"
},
"text": ", a transformer based model",
"orig": ", a transformer based model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 465.4,
"r_x1": 286.4,
"r_y1": 465.4,
"r_x2": 286.4,
"r_y2": 456.5,
"r_x3": 70.0,
"r_y3": 456.5,
"coord_origin": "TOPLEFT"
},
"text": "that predicts tables structure and bounding boxes for",
"orig": "that predicts tables structure and bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 477.4,
"r_x1": 286.4,
"r_y1": 477.4,
"r_x2": 286.4,
"r_y2": 468.5,
"r_x3": 70.0,
"r_y3": 468.5,
"coord_origin": "TOPLEFT"
},
"text": "the table content simultaneously in an end-to-end ap-",
"orig": "the table content simultaneously in an end-to-end ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 489.3,
"r_x1": 99.6,
"r_y1": 489.3,
"r_x2": 99.6,
"r_y2": 480.4,
"r_x3": 70.0,
"r_y3": 480.4,
"coord_origin": "TOPLEFT"
},
"text": "proach.",
"orig": "proach.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."
},
{
"label": "list_item",
"id": 5,
"page_no": 1,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 502.0,
"r": 286.4,
"b": 546.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 511.1,
"r_x1": 71.6,
"r_y1": 511.1,
"r_x2": 71.6,
"r_y2": 502.2,
"r_x3": 61.6,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.1,
"r_y0": 511.1,
"r_x1": 196.1,
"r_y1": 511.1,
"r_x2": 196.1,
"r_y2": 502.2,
"r_x3": 74.1,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "Across all benchmark datasets",
"orig": "Across all benchmark datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 511.0,
"r_x1": 256.1,
"r_y1": 511.0,
"r_x2": 256.1,
"r_y2": 502.0,
"r_x3": 200.3,
"r_y3": 502.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.4,
"r_y0": 511.1,
"r_x1": 286.4,
"r_y1": 511.1,
"r_x2": 286.4,
"r_y2": 502.2,
"r_x3": 260.4,
"r_y3": 502.2,
"coord_origin": "TOPLEFT"
},
"text": "signif-",
"orig": "signif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 523.0,
"r_x1": 286.4,
"r_y1": 523.0,
"r_x2": 286.4,
"r_y2": 514.1,
"r_x3": 70.0,
"r_y3": 514.1,
"coord_origin": "TOPLEFT"
},
"text": "icantly outperforms existing state-of-the-art metrics,",
"orig": "icantly outperforms existing state-of-the-art metrics,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.0,
"r_x1": 286.4,
"r_y1": 535.0,
"r_x2": 286.4,
"r_y2": 526.1,
"r_x3": 70.0,
"r_y3": 526.1,
"coord_origin": "TOPLEFT"
},
"text": "while being much more efficient in training and infer-",
"orig": "while being much more efficient in training and infer-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 161.7,
"r_y1": 546.9,
"r_x2": 161.7,
"r_y2": 538.0,
"r_x3": 70.0,
"r_y3": 538.0,
"coord_origin": "TOPLEFT"
},
"text": "ence to existing works.",
"orig": "ence to existing works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."
},
{
"label": "list_item",
"id": 9,
"page_no": 1,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 559.6,
"r": 286.4,
"b": 592.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 568.7,
"r_x1": 71.1,
"r_y1": 568.7,
"r_x2": 71.1,
"r_y2": 559.8,
"r_x3": 61.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 568.7,
"r_x1": 116.7,
"r_y1": 568.7,
"r_x2": 116.7,
"r_y2": 559.8,
"r_x3": 73.5,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "We present",
"orig": "We present",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 121.6,
"r_y0": 568.6,
"r_x1": 177.7,
"r_y1": 568.6,
"r_x2": 177.7,
"r_y2": 559.6,
"r_x3": 121.6,
"r_y3": 559.6,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 568.7,
"r_x1": 286.4,
"r_y1": 568.7,
"r_x2": 286.4,
"r_y2": 559.8,
"r_x3": 182.6,
"r_y3": 559.8,
"coord_origin": "TOPLEFT"
},
"text": "a synthetically generated",
"orig": "a synthetically generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.6,
"r_x1": 286.4,
"r_y1": 580.6,
"r_x2": 286.4,
"r_y2": 571.7,
"r_x3": 70.0,
"r_y3": 571.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset, with various appearance styles and complex-",
"orig": "dataset, with various appearance styles and complex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 592.6,
"r_x1": 82.4,
"r_y1": 592.6,
"r_x2": 82.4,
"r_y2": 583.7,
"r_x3": 70.0,
"r_y3": 583.7,
"coord_origin": "TOPLEFT"
},
"text": "ity.",
"orig": "ity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."
},
{
"label": "list_item",
"id": 8,
"page_no": 1,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 605.4,
"r": 286.4,
"b": 638.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 614.3,
"r_x1": 72.3,
"r_y1": 614.3,
"r_x2": 72.3,
"r_y2": 605.4,
"r_x3": 61.6,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.0,
"r_y0": 614.3,
"r_x1": 286.4,
"r_y1": 614.3,
"r_x2": 286.4,
"r_y2": 605.4,
"r_x3": 75.0,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "An augmented dataset based on PubTabNet [37],",
"orig": "An augmented dataset based on PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 626.3,
"r_x1": 286.4,
"r_y1": 626.3,
"r_x2": 286.4,
"r_y2": 617.4,
"r_x3": 70.0,
"r_y3": 617.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] with generated",
"orig": "FinTabNet [36], and TableBank [17] with generated",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 638.2,
"r_x1": 198.1,
"r_y1": 638.2,
"r_x2": 198.1,
"r_y2": 629.3,
"r_x3": 70.0,
"r_y3": 629.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth for reproducibility.",
"orig": "ground-truth for reproducibility.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."
},
{
"label": "text",
"id": 11,
"page_no": 1,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 650.6,
"r": 286.4,
"b": 695.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 659.5,
"r_x1": 286.4,
"r_y1": 659.5,
"r_x2": 286.4,
"r_y2": 650.6,
"r_x3": 62.1,
"r_y3": 650.6,
"coord_origin": "TOPLEFT"
},
"text": "The paper is structured as follows. In Sec. 2, we give",
"orig": "The paper is structured as follows. In Sec. 2, we give",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 671.5,
"r_x1": 286.4,
"r_y1": 671.5,
"r_x2": 286.4,
"r_y2": 662.6,
"r_x3": 50.1,
"r_y3": 662.6,
"coord_origin": "TOPLEFT"
},
"text": "a brief overview of the current state-of-the-art. In Sec. 3,",
"orig": "a brief overview of the current state-of-the-art. In Sec. 3,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 683.4,
"r_x1": 286.4,
"r_y1": 683.4,
"r_x2": 286.4,
"r_y2": 674.5,
"r_x3": 50.1,
"r_y3": 674.5,
"coord_origin": "TOPLEFT"
},
"text": "we describe the datasets on which we train. In Sec. 4, we",
"orig": "we describe the datasets on which we train. In Sec. 4, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 695.4,
"r_x1": 286.4,
"r_y1": 695.4,
"r_x2": 286.4,
"r_y2": 686.5,
"r_x3": 50.1,
"r_y3": 686.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce the TableFormer model-architecture and describe",
"orig": "introduce the TableFormer model-architecture and describe",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"
},
{
"label": "footnote",
"id": 14,
"page_no": 1,
"cluster": {
"id": 14,
"label": "footnote",
"bbox": {
"l": 61.0,
"t": 705.6,
"r": 183.7,
"b": 712.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.0,
"r_y0": 712.7,
"r_x1": 183.7,
"r_y1": 712.7,
"r_x2": 183.7,
"r_y2": 705.6,
"r_x3": 61.0,
"r_y3": 705.6,
"coord_origin": "TOPLEFT"
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet",
"orig": "$^{1}$https://github.com/IBM/SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "$^{1}$https://github.com/IBM/SynthTabNet"
},
{
"label": "text",
"id": 10,
"page_no": 1,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "its results & performance in Sec. 5. As a conclusion, we de-",
"orig": "its results & performance in Sec. 5. As a conclusion, we de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "scribe how this new model-architecture can be re-purposed",
"orig": "scribe how this new model-architecture can be re-purposed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 508.1,
"r_y1": 108.0,
"r_x2": 508.1,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for other tasks in the computer-vision community.",
"orig": "for other tasks in the computer-vision community.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "its results & performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."
},
{
"label": "section_header",
"id": 13,
"page_no": 1,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 121.7,
"r": 498.3,
"b": 132.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 132.5,
"r_x1": 315.6,
"r_y1": 132.5,
"r_x2": 315.6,
"r_y2": 121.7,
"r_x3": 308.9,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 324.5,
"r_y0": 132.5,
"r_x1": 498.3,
"r_y1": 132.5,
"r_x2": 498.3,
"r_y2": 121.7,
"r_x3": 324.5,
"r_y3": 121.7,
"coord_origin": "TOPLEFT"
},
"text": "Previous work and State of the Art",
"orig": "Previous work and State of the Art",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Previous work and State of the Art"
},
{
"label": "text",
"id": 0,
"page_no": 1,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 142.2,
"r": 545.1,
"b": 330.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 151.1,
"r_x1": 545.1,
"r_y1": 151.1,
"r_x2": 545.1,
"r_y2": 142.2,
"r_x3": 320.8,
"r_y3": 142.2,
"coord_origin": "TOPLEFT"
},
"text": "Identifying the structure of a table has been an outstand-",
"orig": "Identifying the structure of a table has been an outstand-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 163.1,
"r_x1": 545.1,
"r_y1": 163.1,
"r_x2": 545.1,
"r_y2": 154.2,
"r_x3": 308.9,
"r_y3": 154.2,
"coord_origin": "TOPLEFT"
},
"text": "ing problem in the document-parsing community, that mo-",
"orig": "ing problem in the document-parsing community, that mo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 175.0,
"r_x1": 522.6,
"r_y1": 175.0,
"r_x2": 522.6,
"r_y2": 166.1,
"r_x3": 308.9,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "tivates many organised public challenges [6, 4, 14].",
"orig": "tivates many organised public challenges [6, 4, 14].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 175.0,
"r_x1": 545.1,
"r_y1": 175.0,
"r_x2": 545.1,
"r_y2": 166.1,
"r_x3": 529.6,
"r_y3": 166.1,
"coord_origin": "TOPLEFT"
},
"text": "The",
"orig": "The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 187.0,
"r_x1": 545.1,
"r_y1": 187.0,
"r_x2": 545.1,
"r_y2": 178.1,
"r_x3": 308.9,
"r_y3": 178.1,
"coord_origin": "TOPLEFT"
},
"text": "difficulty of the problem can be attributed to a number of",
"orig": "difficulty of the problem can be attributed to a number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 198.9,
"r_x1": 545.1,
"r_y1": 198.9,
"r_x2": 545.1,
"r_y2": 190.0,
"r_x3": 308.9,
"r_y3": 190.0,
"coord_origin": "TOPLEFT"
},
"text": "factors. First, there is a large variety in the shapes and sizes",
"orig": "factors. First, there is a large variety in the shapes and sizes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 210.9,
"r_x1": 347.0,
"r_y1": 210.9,
"r_x2": 347.0,
"r_y2": 202.0,
"r_x3": 308.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "of tables.",
"orig": "of tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.9,
"r_y0": 210.9,
"r_x1": 545.1,
"r_y1": 210.9,
"r_x2": 545.1,
"r_y2": 202.0,
"r_x3": 354.9,
"r_y3": 202.0,
"coord_origin": "TOPLEFT"
},
"text": "Such large variety requires a flexible method.",
"orig": "Such large variety requires a flexible method.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 222.9,
"r_x1": 545.1,
"r_y1": 222.9,
"r_x2": 545.1,
"r_y2": 214.0,
"r_x3": 308.9,
"r_y3": 214.0,
"coord_origin": "TOPLEFT"
},
"text": "This is especially true for complex column- and row head-",
"orig": "This is especially true for complex column- and row head-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 234.8,
"r_x1": 530.9,
"r_y1": 234.8,
"r_x2": 530.9,
"r_y2": 225.9,
"r_x3": 308.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "ers, which can be extremely intricate and demanding.",
"orig": "ers, which can be extremely intricate and demanding.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.9,
"r_y0": 234.8,
"r_x1": 545.1,
"r_y1": 234.8,
"r_x2": 545.1,
"r_y2": 225.9,
"r_x3": 537.9,
"r_y3": 225.9,
"coord_origin": "TOPLEFT"
},
"text": "A",
"orig": "A",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 246.8,
"r_x1": 545.1,
"r_y1": 246.8,
"r_x2": 545.1,
"r_y2": 237.9,
"r_x3": 308.9,
"r_y3": 237.9,
"coord_origin": "TOPLEFT"
},
"text": "second factor of complexity is the lack of data with regard",
"orig": "second factor of complexity is the lack of data with regard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.7,
"r_x1": 545.1,
"r_y1": 258.7,
"r_x2": 545.1,
"r_y2": 249.8,
"r_x3": 308.9,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "to table-structure. Until the publication of PubTabNet [37],",
"orig": "to table-structure. Until the publication of PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.7,
"r_x1": 439.8,
"r_y1": 270.7,
"r_x2": 439.8,
"r_y2": 261.8,
"r_x3": 308.9,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "there were no large datasets (i.e.",
"orig": "there were no large datasets (i.e.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.4,
"r_y0": 270.5,
"r_x1": 452.2,
"r_y1": 270.5,
"r_x2": 452.2,
"r_y2": 261.6,
"r_x3": 444.4,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.9,
"r_y0": 270.5,
"r_x1": 470.8,
"r_y1": 270.5,
"r_x2": 470.8,
"r_y2": 261.6,
"r_x3": 455.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "100",
"orig": "100",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 470.8,
"r_y0": 270.7,
"r_x1": 545.1,
"r_y1": 270.7,
"r_x2": 545.1,
"r_y2": 261.8,
"r_x3": 470.8,
"r_y3": 261.8,
"coord_origin": "TOPLEFT"
},
"text": "K tables) that pro-",
"orig": "K tables) that pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 273.7,
"r_x3": 308.9,
"r_y3": 273.7,
"coord_origin": "TOPLEFT"
},
"text": "vided structure information. This happens primarily due to",
"orig": "vided structure information. This happens primarily due to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.6,
"r_x1": 545.1,
"r_y1": 294.6,
"r_x2": 545.1,
"r_y2": 285.7,
"r_x3": 308.9,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "the fact that tables are notoriously time-consuming to an-",
"orig": "the fact that tables are notoriously time-consuming to an-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 306.5,
"r_x1": 545.1,
"r_y1": 306.5,
"r_x2": 545.1,
"r_y2": 297.6,
"r_x3": 308.9,
"r_y3": 297.6,
"coord_origin": "TOPLEFT"
},
"text": "notate by hand. However, this has definitely changed in re-",
"orig": "notate by hand. However, this has definitely changed in re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 318.5,
"r_x1": 545.1,
"r_y1": 318.5,
"r_x2": 545.1,
"r_y2": 309.6,
"r_x3": 308.9,
"r_y3": 309.6,
"coord_origin": "TOPLEFT"
},
"text": "cent years with the deliverance of PubTabNet [37], FinTab-",
"orig": "cent years with the deliverance of PubTabNet [37], FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 330.5,
"r_x1": 425.9,
"r_y1": 330.5,
"r_x2": 425.9,
"r_y2": 321.5,
"r_x3": 308.9,
"r_y3": 321.5,
"coord_origin": "TOPLEFT"
},
"text": "Net [36], TableBank [17] etc.",
"orig": "Net [36], TableBank [17] etc.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."
},
{
"label": "text",
"id": 1,
"page_no": 1,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 333.6,
"r": 545.1,
"b": 450.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 342.5,
"r_x1": 545.1,
"r_y1": 342.5,
"r_x2": 545.1,
"r_y2": 333.6,
"r_x3": 320.8,
"r_y3": 333.6,
"coord_origin": "TOPLEFT"
},
"text": "Before the rising popularity of deep neural networks,",
"orig": "Before the rising popularity of deep neural networks,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 354.4,
"r_x1": 545.1,
"r_y1": 354.4,
"r_x2": 545.1,
"r_y2": 345.5,
"r_x3": 308.9,
"r_y3": 345.5,
"coord_origin": "TOPLEFT"
},
"text": "the community relied heavily on heuristic and/or statistical",
"orig": "the community relied heavily on heuristic and/or statistical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 366.4,
"r_x1": 545.1,
"r_y1": 366.4,
"r_x2": 545.1,
"r_y2": 357.5,
"r_x3": 308.9,
"r_y3": 357.5,
"coord_origin": "TOPLEFT"
},
"text": "methods to do table structure identification [3, 7, 11, 5, 13,",
"orig": "methods to do table structure identification [3, 7, 11, 5, 13,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 378.3,
"r_x1": 545.1,
"r_y1": 378.3,
"r_x2": 545.1,
"r_y2": 369.4,
"r_x3": 308.9,
"r_y3": 369.4,
"coord_origin": "TOPLEFT"
},
"text": "28]. Although such methods work well on constrained ta-",
"orig": "28]. Although such methods work well on constrained ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 390.3,
"r_x1": 545.1,
"r_y1": 390.3,
"r_x2": 545.1,
"r_y2": 381.4,
"r_x3": 308.9,
"r_y3": 381.4,
"coord_origin": "TOPLEFT"
},
"text": "bles [12], a more data-driven approach can be applied due",
"orig": "bles [12], a more data-driven approach can be applied due",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 402.3,
"r_x1": 545.1,
"r_y1": 402.3,
"r_x2": 545.1,
"r_y2": 393.3,
"r_x3": 308.9,
"r_y3": 393.3,
"coord_origin": "TOPLEFT"
},
"text": "to the advent of convolutional neural networks (CNNs) and",
"orig": "to the advent of convolutional neural networks (CNNs) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 414.2,
"r_x1": 545.1,
"r_y1": 414.2,
"r_x2": 545.1,
"r_y2": 405.3,
"r_x3": 308.9,
"r_y3": 405.3,
"coord_origin": "TOPLEFT"
},
"text": "the availability of large datasets. To the best-of-our knowl-",
"orig": "the availability of large datasets. To the best-of-our knowl-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 426.2,
"r_x1": 545.1,
"r_y1": 426.2,
"r_x2": 545.1,
"r_y2": 417.3,
"r_x3": 308.9,
"r_y3": 417.3,
"coord_origin": "TOPLEFT"
},
"text": "edge, there are currently two different types of network ar-",
"orig": "edge, there are currently two different types of network ar-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 438.1,
"r_x1": 545.1,
"r_y1": 438.1,
"r_x2": 545.1,
"r_y2": 429.2,
"r_x3": 308.9,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "chitecture that are being pursued for state-of-the-art table-",
"orig": "chitecture that are being pursued for state-of-the-art table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 450.1,
"r_x1": 401.3,
"r_y1": 450.1,
"r_x2": 401.3,
"r_y2": 441.2,
"r_x3": 308.9,
"r_y3": 441.2,
"coord_origin": "TOPLEFT"
},
"text": "structure identification.",
"orig": "structure identification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification."
},
{
"label": "text",
"id": 3,
"page_no": 1,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 453.1,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 462.0,
"r_x1": 423.3,
"r_y1": 462.0,
"r_x2": 423.3,
"r_y2": 453.1,
"r_x3": 320.8,
"r_y3": 453.1,
"coord_origin": "TOPLEFT"
},
"text": "Image-to-Text networks",
"orig": "Image-to-Text networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.3,
"r_y0": 462.1,
"r_x1": 545.1,
"r_y1": 462.1,
"r_x2": 545.1,
"r_y2": 453.2,
"r_x3": 423.3,
"r_y3": 453.2,
"coord_origin": "TOPLEFT"
},
"text": ": In this type of network, one",
"orig": ": In this type of network, one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 474.0,
"r_x1": 545.1,
"r_y1": 474.0,
"r_x2": 545.1,
"r_y2": 465.1,
"r_x3": 308.9,
"r_y3": 465.1,
"coord_origin": "TOPLEFT"
},
"text": "predicts a sequence of tokens starting from an encoded",
"orig": "predicts a sequence of tokens starting from an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 486.0,
"r_x1": 335.7,
"r_y1": 486.0,
"r_x2": 335.7,
"r_y2": 477.1,
"r_x3": 308.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "image.",
"orig": "image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.9,
"r_y0": 486.0,
"r_x1": 545.1,
"r_y1": 486.0,
"r_x2": 545.1,
"r_y2": 477.1,
"r_x3": 345.9,
"r_y3": 477.1,
"coord_origin": "TOPLEFT"
},
"text": "Such sequences of tokens can be HTML table",
"orig": "Such sequences of tokens can be HTML table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 498.0,
"r_x1": 545.1,
"r_y1": 498.0,
"r_x2": 545.1,
"r_y2": 489.1,
"r_x3": 308.9,
"r_y3": 489.1,
"coord_origin": "TOPLEFT"
},
"text": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"orig": "tags [37, 17] or LaTeX symbols[10]. The choice of sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.9,
"r_x1": 545.1,
"r_y1": 509.9,
"r_x2": 545.1,
"r_y2": 501.0,
"r_x3": 308.9,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "bols is ultimately not very important, since one can be trans-",
"orig": "bols is ultimately not very important, since one can be trans-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.9,
"r_x1": 545.1,
"r_y1": 521.9,
"r_x2": 545.1,
"r_y2": 513.0,
"r_x3": 308.9,
"r_y3": 513.0,
"coord_origin": "TOPLEFT"
},
"text": "formed into the other. There are however subtle variations",
"orig": "formed into the other. There are however subtle variations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.9,
"r_x3": 308.9,
"r_y3": 524.9,
"coord_origin": "TOPLEFT"
},
"text": "in the Image-to-Text networks. The easiest network archi-",
"orig": "in the Image-to-Text networks. The easiest network archi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.8,
"r_x1": 420.9,
"r_y1": 545.8,
"r_x2": 420.9,
"r_y2": 536.9,
"r_x3": 308.9,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "tectures are \u201cimage-encoder",
"orig": "tectures are \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 423.6,
"r_y0": 545.6,
"r_x1": 433.6,
"r_y1": 545.6,
"r_x2": 433.6,
"r_y2": 536.2,
"r_x3": 423.6,
"r_y3": 536.2,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.2,
"r_y0": 545.8,
"r_x1": 545.1,
"r_y1": 545.8,
"r_x2": 545.1,
"r_y2": 536.9,
"r_x3": 436.2,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "text-decoder\u201d (IETD), sim-",
"orig": "text-decoder\u201d (IETD), sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ilar to network architectures that try to provide captions to",
"orig": "ilar to network architectures that try to provide captions to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.7,
"r_x1": 545.1,
"r_y1": 569.7,
"r_x2": 545.1,
"r_y2": 560.8,
"r_x3": 308.9,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "images [32]. In these IETD networks, one expects as output",
"orig": "images [32]. In these IETD networks, one expects as output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"orig": "the LaTeX/HTML string of the entire table, i.e. the sym-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.6,
"r_x1": 545.1,
"r_y1": 593.6,
"r_x2": 545.1,
"r_y2": 584.7,
"r_x3": 308.9,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "bols necessary for creating the table with the content of the",
"orig": "bols necessary for creating the table with the content of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.6,
"r_x1": 497.1,
"r_y1": 605.6,
"r_x2": 497.1,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "table. Another approach is the \u201cimage-encoder",
"orig": "table. Another approach is the \u201cimage-encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.8,
"r_y0": 605.3,
"r_x1": 509.8,
"r_y1": 605.3,
"r_x2": 509.8,
"r_y2": 595.9,
"r_x3": 499.8,
"r_y3": 595.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2192",
"orig": "\u2192",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.5,
"r_y0": 605.6,
"r_x1": 545.1,
"r_y1": 605.6,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 512.5,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "dual de-",
"orig": "dual de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.5,
"r_x1": 545.1,
"r_y1": 617.5,
"r_x2": 545.1,
"r_y2": 608.6,
"r_x3": 308.9,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "coder\u201d (IEDD) networks. In these type of networks, one has",
"orig": "coder\u201d (IEDD) networks. In these type of networks, one has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.5,
"r_x1": 545.1,
"r_y1": 629.5,
"r_x2": 545.1,
"r_y2": 620.6,
"r_x3": 308.9,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "two consecutive decoders with different purposes. The first",
"orig": "two consecutive decoders with different purposes. The first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 364.8,
"r_y1": 641.4,
"r_x2": 364.8,
"r_y2": 632.5,
"r_x3": 308.9,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "decoder is the",
"orig": "decoder is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.6,
"r_y0": 641.2,
"r_x1": 415.6,
"r_y1": 641.2,
"r_x2": 415.6,
"r_y2": 632.6,
"r_x3": 367.6,
"r_y3": 632.6,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 415.6,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 415.6,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": ", i.e. it only produces the HTM-",
"orig": ", i.e. it only produces the HTM-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "L/LaTeX tags which construct an empty table. The second",
"orig": "L/LaTeX tags which construct an empty table. The second",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.1,
"r_x1": 373.6,
"r_y1": 665.1,
"r_x2": 373.6,
"r_y2": 656.5,
"r_x3": 308.9,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "content-decoder",
"orig": "content-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 376.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "uses the encoding of the image in combi-",
"orig": "uses the encoding of the image in combi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "nation with the output encoding of each cell-tag (from the",
"orig": "nation with the output encoding of each cell-tag (from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.0,
"r_x1": 356.9,
"r_y1": 689.0,
"r_x2": 356.9,
"r_y2": 680.4,
"r_x3": 308.9,
"r_y3": 680.4,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder",
"orig": "tag-decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.1,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 357.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": ") to generate the textual content of each table",
"orig": ") to generate the textual content of each table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "cell. The network architecture of IEDD is certainly more",
"orig": "cell. The network architecture of IEDD is certainly more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "elaborate, but it has the advantage that one can pre-train the",
"orig": "elaborate, but it has the advantage that one can pre-train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are \"image-encoder \u2192 text-decoder\" (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the \"image-encoder \u2192 dual decoder\" (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"
}
],
"headers": [
{
"label": "page_footer",
"id": 15,
"page_no": 1,
"cluster": {
"id": 15,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2"
}
]
}
},
{
"page_no": 2,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 250.2,
"r_y1": 84.1,
"r_x2": 250.2,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 70.4,
"r_y1": 96.1,
"r_x2": 70.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 96.1,
"r_x1": 111.0,
"r_y1": 96.1,
"r_x2": 111.0,
"r_y2": 87.2,
"r_x3": 76.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.5,
"r_y0": 96.1,
"r_x1": 136.3,
"r_y1": 96.1,
"r_x2": 136.3,
"r_y2": 87.2,
"r_x3": 118.5,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.8,
"r_y0": 96.1,
"r_x1": 175.4,
"r_y1": 96.1,
"r_x2": 175.4,
"r_y2": 87.2,
"r_x3": 142.8,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.9,
"r_y0": 96.1,
"r_x1": 232.8,
"r_y1": 96.1,
"r_x2": 232.8,
"r_y2": 87.2,
"r_x3": 181.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.4,
"r_y0": 96.1,
"r_x1": 265.4,
"r_y1": 96.1,
"r_x2": 265.4,
"r_y2": 87.2,
"r_x3": 239.4,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 272.0,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 272.0,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.1,
"r_x1": 286.4,
"r_y1": 108.1,
"r_x2": 286.4,
"r_y2": 99.2,
"r_x3": 50.1,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.0,
"r_x1": 286.4,
"r_y1": 132.0,
"r_x2": 286.4,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.9,
"r_x1": 286.4,
"r_y1": 155.9,
"r_x2": 286.4,
"r_y2": 147.0,
"r_x3": 50.1,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 167.9,
"r_x1": 286.4,
"r_y1": 167.9,
"r_x2": 286.4,
"r_y2": 159.0,
"r_x3": 50.1,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 179.8,
"r_x1": 286.4,
"r_y1": 179.8,
"r_x2": 286.4,
"r_y2": 170.9,
"r_x3": 50.1,
"r_y3": 170.9,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 191.8,
"r_x1": 286.4,
"r_y1": 191.8,
"r_x2": 286.4,
"r_y2": 182.9,
"r_x3": 50.1,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 203.7,
"r_x1": 286.4,
"r_y1": 203.7,
"r_x2": 286.4,
"r_y2": 194.8,
"r_x3": 50.1,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 215.7,
"r_x1": 286.4,
"r_y1": 215.7,
"r_x2": 286.4,
"r_y2": 206.8,
"r_x3": 50.1,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 227.6,
"r_x1": 286.4,
"r_y1": 227.6,
"r_x2": 286.4,
"r_y2": 218.7,
"r_x3": 50.1,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 239.6,
"r_x1": 286.4,
"r_y1": 239.6,
"r_x2": 286.4,
"r_y2": 230.7,
"r_x3": 50.1,
"r_y3": 230.7,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 251.5,
"r_x1": 286.4,
"r_y1": 251.5,
"r_x2": 286.4,
"r_y2": 242.6,
"r_x3": 50.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 263.5,
"r_x1": 286.4,
"r_y1": 263.5,
"r_x2": 286.4,
"r_y2": 254.6,
"r_x3": 50.1,
"r_y3": 254.6,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 275.5,
"r_x1": 64.8,
"r_y1": 275.5,
"r_x2": 64.8,
"r_y2": 266.5,
"r_x3": 50.1,
"r_y3": 266.5,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 287.4,
"r_x1": 171.6,
"r_y1": 287.4,
"r_x2": 171.6,
"r_y2": 278.4,
"r_x3": 62.1,
"r_y3": 278.4,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.6,
"r_y0": 287.5,
"r_x1": 174.3,
"r_y1": 287.5,
"r_x2": 174.3,
"r_y2": 278.6,
"r_x3": 171.6,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.2,
"r_y0": 287.5,
"r_x1": 286.4,
"r_y1": 287.5,
"r_x2": 286.4,
"r_y2": 278.6,
"r_x3": 185.2,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 299.4,
"r_x1": 286.4,
"r_y1": 299.4,
"r_x2": 286.4,
"r_y2": 290.5,
"r_x3": 50.1,
"r_y3": 290.5,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 311.4,
"r_x1": 131.2,
"r_y1": 311.4,
"r_x2": 131.2,
"r_y2": 302.5,
"r_x3": 50.1,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 311.4,
"r_x1": 286.4,
"r_y1": 311.4,
"r_x2": 286.4,
"r_y2": 302.5,
"r_x3": 138.8,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 323.3,
"r_x1": 286.4,
"r_y1": 323.3,
"r_x2": 286.4,
"r_y2": 314.4,
"r_x3": 50.1,
"r_y3": 314.4,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.3,
"r_x1": 286.4,
"r_y1": 335.3,
"r_x2": 286.4,
"r_y2": 326.4,
"r_x3": 50.1,
"r_y3": 326.4,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.2,
"r_x1": 286.4,
"r_y1": 347.2,
"r_x2": 286.4,
"r_y2": 338.3,
"r_x3": 50.1,
"r_y3": 338.3,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.2,
"r_x1": 286.4,
"r_y1": 359.2,
"r_x2": 286.4,
"r_y2": 350.3,
"r_x3": 50.1,
"r_y3": 350.3,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.2,
"r_x1": 286.4,
"r_y1": 371.2,
"r_x2": 286.4,
"r_y2": 362.2,
"r_x3": 50.1,
"r_y3": 362.2,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.1,
"r_x1": 286.4,
"r_y1": 383.1,
"r_x2": 286.4,
"r_y2": 374.2,
"r_x3": 50.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.1,
"r_x1": 286.4,
"r_y1": 395.1,
"r_x2": 286.4,
"r_y2": 386.2,
"r_x3": 50.1,
"r_y3": 386.2,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 407.0,
"r_x1": 286.4,
"r_y1": 407.0,
"r_x2": 286.4,
"r_y2": 398.1,
"r_x3": 50.1,
"r_y3": 398.1,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.0,
"r_x1": 286.4,
"r_y1": 419.0,
"r_x2": 286.4,
"r_y2": 410.1,
"r_x3": 50.1,
"r_y3": 410.1,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 430.9,
"r_x1": 286.4,
"r_y1": 430.9,
"r_x2": 286.4,
"r_y2": 422.0,
"r_x3": 50.1,
"r_y3": 422.0,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 442.9,
"r_x1": 198.2,
"r_y1": 442.9,
"r_x2": 198.2,
"r_y2": 434.0,
"r_x3": 50.1,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.9,
"r_y0": 442.9,
"r_x1": 286.4,
"r_y1": 442.9,
"r_x2": 286.4,
"r_y2": 434.0,
"r_x3": 205.9,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 454.8,
"r_x1": 286.4,
"r_y1": 454.8,
"r_x2": 286.4,
"r_y2": 445.9,
"r_x3": 50.1,
"r_y3": 445.9,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 466.8,
"r_x1": 286.4,
"r_y1": 466.8,
"r_x2": 286.4,
"r_y2": 457.9,
"r_x3": 50.1,
"r_y3": 457.9,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 478.7,
"r_x1": 286.4,
"r_y1": 478.7,
"r_x2": 286.4,
"r_y2": 469.8,
"r_x3": 50.1,
"r_y3": 469.8,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.1,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 502.6,
"r_x1": 252.9,
"r_y1": 502.6,
"r_x2": 252.9,
"r_y2": 493.7,
"r_x3": 62.1,
"r_y3": 493.7,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.9,
"r_y0": 502.7,
"r_x1": 286.4,
"r_y1": 502.7,
"r_x2": 286.4,
"r_y2": 493.8,
"r_x3": 252.9,
"r_y3": 493.8,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.7,
"r_x1": 286.4,
"r_y1": 514.7,
"r_x2": 286.4,
"r_y2": 505.8,
"r_x3": 50.1,
"r_y3": 505.8,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 526.6,
"r_x1": 286.4,
"r_y1": 526.6,
"r_x2": 286.4,
"r_y2": 517.7,
"r_x3": 50.1,
"r_y3": 517.7,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 538.6,
"r_x1": 286.4,
"r_y1": 538.6,
"r_x2": 286.4,
"r_y2": 529.7,
"r_x3": 50.1,
"r_y3": 529.7,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.5,
"r_x1": 286.4,
"r_y1": 550.5,
"r_x2": 286.4,
"r_y2": 541.6,
"r_x3": 50.1,
"r_y3": 541.6,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 562.5,
"r_x1": 286.4,
"r_y1": 562.5,
"r_x2": 286.4,
"r_y2": 553.6,
"r_x3": 50.1,
"r_y3": 553.6,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 574.4,
"r_x1": 286.4,
"r_y1": 574.4,
"r_x2": 286.4,
"r_y2": 565.5,
"r_x3": 50.1,
"r_y3": 565.5,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.4,
"r_x1": 286.4,
"r_y1": 586.4,
"r_x2": 286.4,
"r_y2": 577.5,
"r_x3": 50.1,
"r_y3": 577.5,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 598.4,
"r_x1": 286.4,
"r_y1": 598.4,
"r_x2": 286.4,
"r_y2": 589.4,
"r_x3": 50.1,
"r_y3": 589.4,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 610.3,
"r_x1": 286.4,
"r_y1": 610.3,
"r_x2": 286.4,
"r_y2": 601.4,
"r_x3": 50.1,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 622.3,
"r_x1": 176.0,
"r_y1": 622.3,
"r_x2": 176.0,
"r_y2": 613.4,
"r_x3": 50.1,
"r_y3": 613.4,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.7,
"r_x1": 57.8,
"r_y1": 646.7,
"r_x2": 57.8,
"r_y2": 635.9,
"r_x3": 50.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.1,
"r_y0": 646.7,
"r_x1": 105.2,
"r_y1": 646.7,
"r_x2": 105.2,
"r_y2": 635.9,
"r_x3": 68.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 62.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 166.2,
"r_y1": 701.2,
"r_x2": 166.2,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.7,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 173.7,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 276.7,
"r_x1": 346.1,
"r_y1": 276.7,
"r_x2": 346.1,
"r_y2": 267.8,
"r_x3": 308.9,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.5,
"r_y0": 276.7,
"r_x1": 545.1,
"r_y1": 276.7,
"r_x2": 545.1,
"r_y2": 267.8,
"r_x3": 354.5,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 288.7,
"r_x1": 498.6,
"r_y1": 288.7,
"r_x2": 498.6,
"r_y2": 279.8,
"r_x3": 308.9,
"r_y3": 279.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 326.4,
"r_x1": 437.3,
"r_y1": 326.4,
"r_x2": 437.3,
"r_y2": 317.5,
"r_x3": 308.9,
"r_y3": 317.5,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 340.4,
"r_x1": 545.1,
"r_y1": 340.4,
"r_x2": 545.1,
"r_y2": 331.5,
"r_x3": 320.8,
"r_y3": 331.5,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.4,
"r_x1": 545.1,
"r_y1": 352.4,
"r_x2": 545.1,
"r_y2": 343.5,
"r_x3": 308.9,
"r_y3": 343.5,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.3,
"r_x1": 545.1,
"r_y1": 364.3,
"r_x2": 545.1,
"r_y2": 355.4,
"r_x3": 308.9,
"r_y3": 355.4,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.3,
"r_x1": 545.1,
"r_y1": 376.3,
"r_x2": 545.1,
"r_y2": 367.4,
"r_x3": 308.9,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.3,
"r_x1": 545.1,
"r_y1": 388.3,
"r_x2": 545.1,
"r_y2": 379.4,
"r_x3": 308.9,
"r_y3": 379.4,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 308.9,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 545.1,
"r_y1": 460.0,
"r_x2": 545.1,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 471.9,
"r_x1": 545.1,
"r_y1": 471.9,
"r_x2": 545.1,
"r_y2": 463.0,
"r_x3": 308.9,
"r_y3": 463.0,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 483.9,
"r_x1": 545.1,
"r_y1": 483.9,
"r_x2": 545.1,
"r_y2": 475.0,
"r_x3": 308.9,
"r_y3": 475.0,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 495.9,
"r_x1": 545.1,
"r_y1": 495.9,
"r_x2": 545.1,
"r_y2": 486.9,
"r_x3": 308.9,
"r_y3": 486.9,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 507.8,
"r_x1": 545.1,
"r_y1": 507.8,
"r_x2": 545.1,
"r_y2": 498.9,
"r_x3": 308.9,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 519.8,
"r_x1": 545.1,
"r_y1": 519.8,
"r_x2": 545.1,
"r_y2": 510.9,
"r_x3": 308.9,
"r_y3": 510.9,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 531.7,
"r_x1": 545.1,
"r_y1": 531.7,
"r_x2": 545.1,
"r_y2": 522.8,
"r_x3": 308.9,
"r_y3": 522.8,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 543.7,
"r_x1": 545.1,
"r_y1": 543.7,
"r_x2": 545.1,
"r_y2": 534.8,
"r_x3": 308.9,
"r_y3": 534.8,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 555.6,
"r_x1": 545.1,
"r_y1": 555.6,
"r_x2": 545.1,
"r_y2": 546.7,
"r_x3": 308.9,
"r_y3": 546.7,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.6,
"r_x1": 545.1,
"r_y1": 567.6,
"r_x2": 545.1,
"r_y2": 558.7,
"r_x3": 308.9,
"r_y3": 558.7,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 579.5,
"r_x1": 545.1,
"r_y1": 579.5,
"r_x2": 545.1,
"r_y2": 570.6,
"r_x3": 308.9,
"r_y3": 570.6,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 591.5,
"r_x1": 545.1,
"r_y1": 591.5,
"r_x2": 545.1,
"r_y2": 582.6,
"r_x3": 308.9,
"r_y3": 582.6,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 603.5,
"r_x1": 545.1,
"r_y1": 603.5,
"r_x2": 545.1,
"r_y2": 594.5,
"r_x3": 308.9,
"r_y3": 594.5,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 615.4,
"r_x1": 545.1,
"r_y1": 615.4,
"r_x2": 545.1,
"r_y2": 606.5,
"r_x3": 308.9,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 627.4,
"r_x1": 348.2,
"r_y1": 627.4,
"r_x2": 348.2,
"r_y2": 618.5,
"r_x3": 308.9,
"r_y3": 618.5,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 320.8,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 308.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 250.2,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 250.2,
"r_y1": 84.1,
"r_x2": 250.2,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 275.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 70.4,
"r_y1": 96.1,
"r_x2": 70.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 96.1,
"r_x1": 111.0,
"r_y1": 96.1,
"r_x2": 111.0,
"r_y2": 87.2,
"r_x3": 76.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.5,
"r_y0": 96.1,
"r_x1": 136.3,
"r_y1": 96.1,
"r_x2": 136.3,
"r_y2": 87.2,
"r_x3": 118.5,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.8,
"r_y0": 96.1,
"r_x1": 175.4,
"r_y1": 96.1,
"r_x2": 175.4,
"r_y2": 87.2,
"r_x3": 142.8,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.9,
"r_y0": 96.1,
"r_x1": 232.8,
"r_y1": 96.1,
"r_x2": 232.8,
"r_y2": 87.2,
"r_x3": 181.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.4,
"r_y0": 96.1,
"r_x1": 265.4,
"r_y1": 96.1,
"r_x2": 265.4,
"r_y2": 87.2,
"r_x3": 239.4,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 272.0,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 272.0,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.1,
"r_x1": 286.4,
"r_y1": 108.1,
"r_x2": 286.4,
"r_y2": 99.2,
"r_x3": 50.1,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.0,
"r_x1": 286.4,
"r_y1": 132.0,
"r_x2": 286.4,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.9,
"r_x1": 286.4,
"r_y1": 155.9,
"r_x2": 286.4,
"r_y2": 147.0,
"r_x3": 50.1,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 167.9,
"r_x1": 286.4,
"r_y1": 167.9,
"r_x2": 286.4,
"r_y2": 159.0,
"r_x3": 50.1,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 179.8,
"r_x1": 286.4,
"r_y1": 179.8,
"r_x2": 286.4,
"r_y2": 170.9,
"r_x3": 50.1,
"r_y3": 170.9,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 191.8,
"r_x1": 286.4,
"r_y1": 191.8,
"r_x2": 286.4,
"r_y2": 182.9,
"r_x3": 50.1,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 203.7,
"r_x1": 286.4,
"r_y1": 203.7,
"r_x2": 286.4,
"r_y2": 194.8,
"r_x3": 50.1,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 215.7,
"r_x1": 286.4,
"r_y1": 215.7,
"r_x2": 286.4,
"r_y2": 206.8,
"r_x3": 50.1,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 227.6,
"r_x1": 286.4,
"r_y1": 227.6,
"r_x2": 286.4,
"r_y2": 218.7,
"r_x3": 50.1,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 239.6,
"r_x1": 286.4,
"r_y1": 239.6,
"r_x2": 286.4,
"r_y2": 230.7,
"r_x3": 50.1,
"r_y3": 230.7,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 251.5,
"r_x1": 286.4,
"r_y1": 251.5,
"r_x2": 286.4,
"r_y2": 242.6,
"r_x3": 50.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 263.5,
"r_x1": 286.4,
"r_y1": 263.5,
"r_x2": 286.4,
"r_y2": 254.6,
"r_x3": 50.1,
"r_y3": 254.6,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 275.5,
"r_x1": 64.8,
"r_y1": 275.5,
"r_x2": 64.8,
"r_y2": 266.5,
"r_x3": 50.1,
"r_y3": 266.5,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 278.4,
"r": 286.4,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 287.4,
"r_x1": 171.6,
"r_y1": 287.4,
"r_x2": 171.6,
"r_y2": 278.4,
"r_x3": 62.1,
"r_y3": 278.4,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.6,
"r_y0": 287.5,
"r_x1": 174.3,
"r_y1": 287.5,
"r_x2": 174.3,
"r_y2": 278.6,
"r_x3": 171.6,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.2,
"r_y0": 287.5,
"r_x1": 286.4,
"r_y1": 287.5,
"r_x2": 286.4,
"r_y2": 278.6,
"r_x3": 185.2,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 299.4,
"r_x1": 286.4,
"r_y1": 299.4,
"r_x2": 286.4,
"r_y2": 290.5,
"r_x3": 50.1,
"r_y3": 290.5,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 311.4,
"r_x1": 131.2,
"r_y1": 311.4,
"r_x2": 131.2,
"r_y2": 302.5,
"r_x3": 50.1,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 311.4,
"r_x1": 286.4,
"r_y1": 311.4,
"r_x2": 286.4,
"r_y2": 302.5,
"r_x3": 138.8,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 323.3,
"r_x1": 286.4,
"r_y1": 323.3,
"r_x2": 286.4,
"r_y2": 314.4,
"r_x3": 50.1,
"r_y3": 314.4,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.3,
"r_x1": 286.4,
"r_y1": 335.3,
"r_x2": 286.4,
"r_y2": 326.4,
"r_x3": 50.1,
"r_y3": 326.4,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.2,
"r_x1": 286.4,
"r_y1": 347.2,
"r_x2": 286.4,
"r_y2": 338.3,
"r_x3": 50.1,
"r_y3": 338.3,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.2,
"r_x1": 286.4,
"r_y1": 359.2,
"r_x2": 286.4,
"r_y2": 350.3,
"r_x3": 50.1,
"r_y3": 350.3,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.2,
"r_x1": 286.4,
"r_y1": 371.2,
"r_x2": 286.4,
"r_y2": 362.2,
"r_x3": 50.1,
"r_y3": 362.2,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.1,
"r_x1": 286.4,
"r_y1": 383.1,
"r_x2": 286.4,
"r_y2": 374.2,
"r_x3": 50.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.1,
"r_x1": 286.4,
"r_y1": 395.1,
"r_x2": 286.4,
"r_y2": 386.2,
"r_x3": 50.1,
"r_y3": 386.2,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 407.0,
"r_x1": 286.4,
"r_y1": 407.0,
"r_x2": 286.4,
"r_y2": 398.1,
"r_x3": 50.1,
"r_y3": 398.1,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.0,
"r_x1": 286.4,
"r_y1": 419.0,
"r_x2": 286.4,
"r_y2": 410.1,
"r_x3": 50.1,
"r_y3": 410.1,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 430.9,
"r_x1": 286.4,
"r_y1": 430.9,
"r_x2": 286.4,
"r_y2": 422.0,
"r_x3": 50.1,
"r_y3": 422.0,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 442.9,
"r_x1": 198.2,
"r_y1": 442.9,
"r_x2": 198.2,
"r_y2": 434.0,
"r_x3": 50.1,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.9,
"r_y0": 442.9,
"r_x1": 286.4,
"r_y1": 442.9,
"r_x2": 286.4,
"r_y2": 434.0,
"r_x3": 205.9,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 454.8,
"r_x1": 286.4,
"r_y1": 454.8,
"r_x2": 286.4,
"r_y2": 445.9,
"r_x3": 50.1,
"r_y3": 445.9,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 466.8,
"r_x1": 286.4,
"r_y1": 466.8,
"r_x2": 286.4,
"r_y2": 457.9,
"r_x3": 50.1,
"r_y3": 457.9,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 478.7,
"r_x1": 286.4,
"r_y1": 478.7,
"r_x2": 286.4,
"r_y2": 469.8,
"r_x3": 50.1,
"r_y3": 469.8,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.1,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 493.7,
"r": 286.4,
"b": 622.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 502.6,
"r_x1": 252.9,
"r_y1": 502.6,
"r_x2": 252.9,
"r_y2": 493.7,
"r_x3": 62.1,
"r_y3": 493.7,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.9,
"r_y0": 502.7,
"r_x1": 286.4,
"r_y1": 502.7,
"r_x2": 286.4,
"r_y2": 493.8,
"r_x3": 252.9,
"r_y3": 493.8,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.7,
"r_x1": 286.4,
"r_y1": 514.7,
"r_x2": 286.4,
"r_y2": 505.8,
"r_x3": 50.1,
"r_y3": 505.8,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 526.6,
"r_x1": 286.4,
"r_y1": 526.6,
"r_x2": 286.4,
"r_y2": 517.7,
"r_x3": 50.1,
"r_y3": 517.7,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 538.6,
"r_x1": 286.4,
"r_y1": 538.6,
"r_x2": 286.4,
"r_y2": 529.7,
"r_x3": 50.1,
"r_y3": 529.7,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.5,
"r_x1": 286.4,
"r_y1": 550.5,
"r_x2": 286.4,
"r_y2": 541.6,
"r_x3": 50.1,
"r_y3": 541.6,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 562.5,
"r_x1": 286.4,
"r_y1": 562.5,
"r_x2": 286.4,
"r_y2": 553.6,
"r_x3": 50.1,
"r_y3": 553.6,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 574.4,
"r_x1": 286.4,
"r_y1": 574.4,
"r_x2": 286.4,
"r_y2": 565.5,
"r_x3": 50.1,
"r_y3": 565.5,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.4,
"r_x1": 286.4,
"r_y1": 586.4,
"r_x2": 286.4,
"r_y2": 577.5,
"r_x3": 50.1,
"r_y3": 577.5,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 598.4,
"r_x1": 286.4,
"r_y1": 598.4,
"r_x2": 286.4,
"r_y2": 589.4,
"r_x3": 50.1,
"r_y3": 589.4,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 610.3,
"r_x1": 286.4,
"r_y1": 610.3,
"r_x2": 286.4,
"r_y2": 601.4,
"r_x3": 50.1,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 622.3,
"r_x1": 176.0,
"r_y1": 622.3,
"r_x2": 176.0,
"r_y2": 613.4,
"r_x3": 50.1,
"r_y3": 613.4,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 635.9,
"r": 105.2,
"b": 646.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.7,
"r_x1": 57.8,
"r_y1": 646.7,
"r_x2": 57.8,
"r_y2": 635.9,
"r_x3": 50.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.1,
"r_y0": 646.7,
"r_x1": 105.2,
"r_y1": 646.7,
"r_x2": 105.2,
"r_y2": 635.9,
"r_x3": 68.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 656.4,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 62.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 166.2,
"r_y1": 701.2,
"r_x2": 166.2,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.7,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 173.7,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.4,
"r": 550.4,
"b": 250.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.8,
"r": 486.8,
"b": 88.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.8,
"t": 242.0,
"r": 469.8,
"b": 250.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 321.0,
"t": 233.4,
"r": 324.8,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.5,
"t": 233.4,
"r": 418.1,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.8,
"t": 233.4,
"r": 508.5,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.4,
"r": 372.9,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.7,
"t": 233.4,
"r": 463.3,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.0,
"t": 233.4,
"r": 549.7,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.0,
"t": 230.4,
"r": 319.9,
"b": 236.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.6,
"t": 198.7,
"r": 316.4,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.4,
"t": 198.7,
"r": 320.3,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.1,
"t": 168.1,
"r": 317.0,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 317.0,
"t": 168.1,
"r": 320.8,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.9,
"t": 136.6,
"r": 316.7,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.7,
"t": 136.6,
"r": 320.6,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.5,
"t": 105.6,
"r": 316.3,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.1,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.5,
"t": 212.3,
"r": 316.3,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.3,
"r": 320.1,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.1,
"t": 183.7,
"r": 316.9,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.9,
"t": 183.7,
"r": 320.7,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.8,
"t": 152.5,
"r": 316.6,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.6,
"t": 152.5,
"r": 320.4,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.6,
"r": 316.0,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.0,
"t": 120.6,
"r": 319.8,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.8,
"t": 90.1,
"r": 316.6,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.6,
"t": 90.1,
"r": 320.4,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.2,
"t": 222.7,
"r": 536.9,
"b": 230.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.9,
"t": 108.3,
"r": 547.6,
"b": 115.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.8,
"t": 130.8,
"r": 542.7,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.9,
"r": 542.8,
"b": 161.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.6,
"t": 176.8,
"r": 542.5,
"b": 184.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.1,
"t": 199.6,
"r": 542.1,
"b": 206.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 7,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 267.8,
"r": 545.1,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 276.7,
"r_x1": 346.1,
"r_y1": 276.7,
"r_x2": 346.1,
"r_y2": 267.8,
"r_x3": 308.9,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.5,
"r_y0": 276.7,
"r_x1": 545.1,
"r_y1": 276.7,
"r_x2": 545.1,
"r_y2": 267.8,
"r_x3": 354.5,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 288.7,
"r_x1": 498.6,
"r_y1": 288.7,
"r_x2": 498.6,
"r_y2": 279.8,
"r_x3": 308.9,
"r_y3": 279.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 317.5,
"r": 437.3,
"b": 326.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 326.4,
"r_x1": 437.3,
"r_y1": 326.4,
"r_x2": 437.3,
"r_y2": 317.5,
"r_x3": 308.9,
"r_y3": 317.5,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 331.5,
"r": 545.1,
"b": 627.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 340.4,
"r_x1": 545.1,
"r_y1": 340.4,
"r_x2": 545.1,
"r_y2": 331.5,
"r_x3": 320.8,
"r_y3": 331.5,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.4,
"r_x1": 545.1,
"r_y1": 352.4,
"r_x2": 545.1,
"r_y2": 343.5,
"r_x3": 308.9,
"r_y3": 343.5,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.3,
"r_x1": 545.1,
"r_y1": 364.3,
"r_x2": 545.1,
"r_y2": 355.4,
"r_x3": 308.9,
"r_y3": 355.4,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.3,
"r_x1": 545.1,
"r_y1": 376.3,
"r_x2": 545.1,
"r_y2": 367.4,
"r_x3": 308.9,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.3,
"r_x1": 545.1,
"r_y1": 388.3,
"r_x2": 545.1,
"r_y2": 379.4,
"r_x3": 308.9,
"r_y3": 379.4,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 308.9,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 545.1,
"r_y1": 460.0,
"r_x2": 545.1,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 471.9,
"r_x1": 545.1,
"r_y1": 471.9,
"r_x2": 545.1,
"r_y2": 463.0,
"r_x3": 308.9,
"r_y3": 463.0,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 483.9,
"r_x1": 545.1,
"r_y1": 483.9,
"r_x2": 545.1,
"r_y2": 475.0,
"r_x3": 308.9,
"r_y3": 475.0,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 495.9,
"r_x1": 545.1,
"r_y1": 495.9,
"r_x2": 545.1,
"r_y2": 486.9,
"r_x3": 308.9,
"r_y3": 486.9,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 507.8,
"r_x1": 545.1,
"r_y1": 507.8,
"r_x2": 545.1,
"r_y2": 498.9,
"r_x3": 308.9,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 519.8,
"r_x1": 545.1,
"r_y1": 519.8,
"r_x2": 545.1,
"r_y2": 510.9,
"r_x3": 308.9,
"r_y3": 510.9,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 531.7,
"r_x1": 545.1,
"r_y1": 531.7,
"r_x2": 545.1,
"r_y2": 522.8,
"r_x3": 308.9,
"r_y3": 522.8,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 543.7,
"r_x1": 545.1,
"r_y1": 543.7,
"r_x2": 545.1,
"r_y2": 534.8,
"r_x3": 308.9,
"r_y3": 534.8,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 555.6,
"r_x1": 545.1,
"r_y1": 555.6,
"r_x2": 545.1,
"r_y2": 546.7,
"r_x3": 308.9,
"r_y3": 546.7,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.6,
"r_x1": 545.1,
"r_y1": 567.6,
"r_x2": 545.1,
"r_y2": 558.7,
"r_x3": 308.9,
"r_y3": 558.7,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 579.5,
"r_x1": 545.1,
"r_y1": 579.5,
"r_x2": 545.1,
"r_y2": 570.6,
"r_x3": 308.9,
"r_y3": 570.6,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 591.5,
"r_x1": 545.1,
"r_y1": 591.5,
"r_x2": 545.1,
"r_y2": 582.6,
"r_x3": 308.9,
"r_y3": 582.6,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 603.5,
"r_x1": 545.1,
"r_y1": 603.5,
"r_x2": 545.1,
"r_y2": 594.5,
"r_x3": 308.9,
"r_y3": 594.5,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 615.4,
"r_x1": 545.1,
"r_y1": 615.4,
"r_x2": 545.1,
"r_y2": 606.5,
"r_x3": 308.9,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 627.4,
"r_x1": 348.2,
"r_y1": 627.4,
"r_x2": 348.2,
"r_y2": 618.5,
"r_x3": 308.9,
"r_y3": 618.5,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 632.5,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 320.8,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 308.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 10,
"page_no": 2,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 250.2,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 250.2,
"r_y1": 84.1,
"r_x2": 250.2,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tag-decoder which is constrained to the table-tags."
},
{
"label": "text",
"id": 5,
"page_no": 2,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 275.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 70.4,
"r_y1": 96.1,
"r_x2": 70.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 96.1,
"r_x1": 111.0,
"r_y1": 96.1,
"r_x2": 111.0,
"r_y2": 87.2,
"r_x3": 76.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.5,
"r_y0": 96.1,
"r_x1": 136.3,
"r_y1": 96.1,
"r_x2": 136.3,
"r_y2": 87.2,
"r_x3": 118.5,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.8,
"r_y0": 96.1,
"r_x1": 175.4,
"r_y1": 96.1,
"r_x2": 175.4,
"r_y2": 87.2,
"r_x3": 142.8,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.9,
"r_y0": 96.1,
"r_x1": 232.8,
"r_y1": 96.1,
"r_x2": 232.8,
"r_y2": 87.2,
"r_x3": 181.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.4,
"r_y0": 96.1,
"r_x1": 265.4,
"r_y1": 96.1,
"r_x2": 265.4,
"r_y2": 87.2,
"r_x3": 239.4,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 272.0,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 272.0,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.1,
"r_x1": 286.4,
"r_y1": 108.1,
"r_x2": 286.4,
"r_y2": 99.2,
"r_x3": 50.1,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.0,
"r_x1": 286.4,
"r_y1": 132.0,
"r_x2": 286.4,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.9,
"r_x1": 286.4,
"r_y1": 155.9,
"r_x2": 286.4,
"r_y2": 147.0,
"r_x3": 50.1,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 167.9,
"r_x1": 286.4,
"r_y1": 167.9,
"r_x2": 286.4,
"r_y2": 159.0,
"r_x3": 50.1,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 179.8,
"r_x1": 286.4,
"r_y1": 179.8,
"r_x2": 286.4,
"r_y2": 170.9,
"r_x3": 50.1,
"r_y3": 170.9,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 191.8,
"r_x1": 286.4,
"r_y1": 191.8,
"r_x2": 286.4,
"r_y2": 182.9,
"r_x3": 50.1,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 203.7,
"r_x1": 286.4,
"r_y1": 203.7,
"r_x2": 286.4,
"r_y2": 194.8,
"r_x3": 50.1,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 215.7,
"r_x1": 286.4,
"r_y1": 215.7,
"r_x2": 286.4,
"r_y2": 206.8,
"r_x3": 50.1,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 227.6,
"r_x1": 286.4,
"r_y1": 227.6,
"r_x2": 286.4,
"r_y2": 218.7,
"r_x3": 50.1,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 239.6,
"r_x1": 286.4,
"r_y1": 239.6,
"r_x2": 286.4,
"r_y2": 230.7,
"r_x3": 50.1,
"r_y3": 230.7,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 251.5,
"r_x1": 286.4,
"r_y1": 251.5,
"r_x2": 286.4,
"r_y2": 242.6,
"r_x3": 50.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 263.5,
"r_x1": 286.4,
"r_y1": 263.5,
"r_x2": 286.4,
"r_y2": 254.6,
"r_x3": 50.1,
"r_y3": 254.6,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 275.5,
"r_x1": 64.8,
"r_y1": 275.5,
"r_x2": 64.8,
"r_y2": 266.5,
"r_x3": 50.1,
"r_y3": 266.5,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."
},
{
"label": "text",
"id": 0,
"page_no": 2,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 278.4,
"r": 286.4,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 287.4,
"r_x1": 171.6,
"r_y1": 287.4,
"r_x2": 171.6,
"r_y2": 278.4,
"r_x3": 62.1,
"r_y3": 278.4,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.6,
"r_y0": 287.5,
"r_x1": 174.3,
"r_y1": 287.5,
"r_x2": 174.3,
"r_y2": 278.6,
"r_x3": 171.6,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.2,
"r_y0": 287.5,
"r_x1": 286.4,
"r_y1": 287.5,
"r_x2": 286.4,
"r_y2": 278.6,
"r_x3": 185.2,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 299.4,
"r_x1": 286.4,
"r_y1": 299.4,
"r_x2": 286.4,
"r_y2": 290.5,
"r_x3": 50.1,
"r_y3": 290.5,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 311.4,
"r_x1": 131.2,
"r_y1": 311.4,
"r_x2": 131.2,
"r_y2": 302.5,
"r_x3": 50.1,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 311.4,
"r_x1": 286.4,
"r_y1": 311.4,
"r_x2": 286.4,
"r_y2": 302.5,
"r_x3": 138.8,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 323.3,
"r_x1": 286.4,
"r_y1": 323.3,
"r_x2": 286.4,
"r_y2": 314.4,
"r_x3": 50.1,
"r_y3": 314.4,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.3,
"r_x1": 286.4,
"r_y1": 335.3,
"r_x2": 286.4,
"r_y2": 326.4,
"r_x3": 50.1,
"r_y3": 326.4,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.2,
"r_x1": 286.4,
"r_y1": 347.2,
"r_x2": 286.4,
"r_y2": 338.3,
"r_x3": 50.1,
"r_y3": 338.3,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.2,
"r_x1": 286.4,
"r_y1": 359.2,
"r_x2": 286.4,
"r_y2": 350.3,
"r_x3": 50.1,
"r_y3": 350.3,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.2,
"r_x1": 286.4,
"r_y1": 371.2,
"r_x2": 286.4,
"r_y2": 362.2,
"r_x3": 50.1,
"r_y3": 362.2,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.1,
"r_x1": 286.4,
"r_y1": 383.1,
"r_x2": 286.4,
"r_y2": 374.2,
"r_x3": 50.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.1,
"r_x1": 286.4,
"r_y1": 395.1,
"r_x2": 286.4,
"r_y2": 386.2,
"r_x3": 50.1,
"r_y3": 386.2,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 407.0,
"r_x1": 286.4,
"r_y1": 407.0,
"r_x2": 286.4,
"r_y2": 398.1,
"r_x3": 50.1,
"r_y3": 398.1,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.0,
"r_x1": 286.4,
"r_y1": 419.0,
"r_x2": 286.4,
"r_y2": 410.1,
"r_x3": 50.1,
"r_y3": 410.1,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 430.9,
"r_x1": 286.4,
"r_y1": 430.9,
"r_x2": 286.4,
"r_y2": 422.0,
"r_x3": 50.1,
"r_y3": 422.0,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 442.9,
"r_x1": 198.2,
"r_y1": 442.9,
"r_x2": 198.2,
"r_y2": 434.0,
"r_x3": 50.1,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.9,
"r_y0": 442.9,
"r_x1": 286.4,
"r_y1": 442.9,
"r_x2": 286.4,
"r_y2": 434.0,
"r_x3": 205.9,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 454.8,
"r_x1": 286.4,
"r_y1": 454.8,
"r_x2": 286.4,
"r_y2": 445.9,
"r_x3": 50.1,
"r_y3": 445.9,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 466.8,
"r_x1": 286.4,
"r_y1": 466.8,
"r_x2": 286.4,
"r_y2": 457.9,
"r_x3": 50.1,
"r_y3": 457.9,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 478.7,
"r_x1": 286.4,
"r_y1": 478.7,
"r_x2": 286.4,
"r_y2": 469.8,
"r_x3": 50.1,
"r_y3": 469.8,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.1,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."
},
{
"label": "text",
"id": 1,
"page_no": 2,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 493.7,
"r": 286.4,
"b": 622.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 502.6,
"r_x1": 252.9,
"r_y1": 502.6,
"r_x2": 252.9,
"r_y2": 493.7,
"r_x3": 62.1,
"r_y3": 493.7,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.9,
"r_y0": 502.7,
"r_x1": 286.4,
"r_y1": 502.7,
"r_x2": 286.4,
"r_y2": 493.8,
"r_x3": 252.9,
"r_y3": 493.8,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.7,
"r_x1": 286.4,
"r_y1": 514.7,
"r_x2": 286.4,
"r_y2": 505.8,
"r_x3": 50.1,
"r_y3": 505.8,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 526.6,
"r_x1": 286.4,
"r_y1": 526.6,
"r_x2": 286.4,
"r_y2": 517.7,
"r_x3": 50.1,
"r_y3": 517.7,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 538.6,
"r_x1": 286.4,
"r_y1": 538.6,
"r_x2": 286.4,
"r_y2": 529.7,
"r_x3": 50.1,
"r_y3": 529.7,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.5,
"r_x1": 286.4,
"r_y1": 550.5,
"r_x2": 286.4,
"r_y2": 541.6,
"r_x3": 50.1,
"r_y3": 541.6,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 562.5,
"r_x1": 286.4,
"r_y1": 562.5,
"r_x2": 286.4,
"r_y2": 553.6,
"r_x3": 50.1,
"r_y3": 553.6,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 574.4,
"r_x1": 286.4,
"r_y1": 574.4,
"r_x2": 286.4,
"r_y2": 565.5,
"r_x3": 50.1,
"r_y3": 565.5,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.4,
"r_x1": 286.4,
"r_y1": 586.4,
"r_x2": 286.4,
"r_y2": 577.5,
"r_x3": 50.1,
"r_y3": 577.5,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 598.4,
"r_x1": 286.4,
"r_y1": 598.4,
"r_x2": 286.4,
"r_y2": 589.4,
"r_x3": 50.1,
"r_y3": 589.4,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 610.3,
"r_x1": 286.4,
"r_y1": 610.3,
"r_x2": 286.4,
"r_y2": 601.4,
"r_x3": 50.1,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 622.3,
"r_x1": 176.0,
"r_y1": 622.3,
"r_x2": 176.0,
"r_y2": 613.4,
"r_x3": 50.1,
"r_y3": 613.4,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."
},
{
"label": "section_header",
"id": 8,
"page_no": 2,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 635.9,
"r": 105.2,
"b": 646.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.7,
"r_x1": 57.8,
"r_y1": 646.7,
"r_x2": 57.8,
"r_y2": 635.9,
"r_x3": 50.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.1,
"r_y0": 646.7,
"r_x1": 105.2,
"r_y1": 646.7,
"r_x2": 105.2,
"r_y2": 635.9,
"r_x3": 68.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Datasets"
},
{
"label": "text",
"id": 3,
"page_no": 2,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 656.4,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 62.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 166.2,
"r_y1": 701.2,
"r_x2": 166.2,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.7,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 173.7,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"
},
{
"label": "picture",
"id": 6,
"page_no": 2,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.4,
"r": 550.4,
"b": 250.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.8,
"r": 486.8,
"b": 88.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.8,
"t": 242.0,
"r": 469.8,
"b": 250.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 321.0,
"t": 233.4,
"r": 324.8,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.5,
"t": 233.4,
"r": 418.1,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.8,
"t": 233.4,
"r": 508.5,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.4,
"r": 372.9,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.7,
"t": 233.4,
"r": 463.3,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.0,
"t": 233.4,
"r": 549.7,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.0,
"t": 230.4,
"r": 319.9,
"b": 236.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.6,
"t": 198.7,
"r": 316.4,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.4,
"t": 198.7,
"r": 320.3,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.1,
"t": 168.1,
"r": 317.0,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 317.0,
"t": 168.1,
"r": 320.8,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.9,
"t": 136.6,
"r": 316.7,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.7,
"t": 136.6,
"r": 320.6,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.5,
"t": 105.6,
"r": 316.3,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.1,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.5,
"t": 212.3,
"r": 316.3,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.3,
"r": 320.1,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.1,
"t": 183.7,
"r": 316.9,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.9,
"t": 183.7,
"r": 320.7,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.8,
"t": 152.5,
"r": 316.6,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.6,
"t": 152.5,
"r": 320.4,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.6,
"r": 316.0,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.0,
"t": 120.6,
"r": 319.8,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.8,
"t": 90.1,
"r": 316.6,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.6,
"t": 90.1,
"r": 320.4,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.2,
"t": 222.7,
"r": 536.9,
"b": 230.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.9,
"t": 108.3,
"r": 547.6,
"b": 115.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.8,
"t": 130.8,
"r": 542.7,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.9,
"r": 542.8,
"b": 161.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.6,
"t": 176.8,
"r": 542.5,
"b": 184.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.1,
"t": 199.6,
"r": 542.1,
"b": 206.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 7,
"page_no": 2,
"cluster": {
"id": 7,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 267.8,
"r": 545.1,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 276.7,
"r_x1": 346.1,
"r_y1": 276.7,
"r_x2": 346.1,
"r_y2": 267.8,
"r_x3": 308.9,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.5,
"r_y0": 276.7,
"r_x1": 545.1,
"r_y1": 276.7,
"r_x2": 545.1,
"r_y2": 267.8,
"r_x3": 354.5,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 288.7,
"r_x1": 498.6,
"r_y1": 288.7,
"r_x2": 498.6,
"r_y2": 279.8,
"r_x3": 308.9,
"r_y3": 279.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"
},
{
"label": "text",
"id": 9,
"page_no": 2,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 317.5,
"r": 437.3,
"b": 326.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 326.4,
"r_x1": 437.3,
"r_y1": 326.4,
"r_x2": 437.3,
"r_y2": 317.5,
"r_x3": 308.9,
"r_y3": 317.5,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "balance in the previous datasets."
},
{
"label": "text",
"id": 2,
"page_no": 2,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 331.5,
"r": 545.1,
"b": 627.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 340.4,
"r_x1": 545.1,
"r_y1": 340.4,
"r_x2": 545.1,
"r_y2": 331.5,
"r_x3": 320.8,
"r_y3": 331.5,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.4,
"r_x1": 545.1,
"r_y1": 352.4,
"r_x2": 545.1,
"r_y2": 343.5,
"r_x3": 308.9,
"r_y3": 343.5,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.3,
"r_x1": 545.1,
"r_y1": 364.3,
"r_x2": 545.1,
"r_y2": 355.4,
"r_x3": 308.9,
"r_y3": 355.4,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.3,
"r_x1": 545.1,
"r_y1": 376.3,
"r_x2": 545.1,
"r_y2": 367.4,
"r_x3": 308.9,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.3,
"r_x1": 545.1,
"r_y1": 388.3,
"r_x2": 545.1,
"r_y2": 379.4,
"r_x3": 308.9,
"r_y3": 379.4,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 308.9,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 545.1,
"r_y1": 460.0,
"r_x2": 545.1,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 471.9,
"r_x1": 545.1,
"r_y1": 471.9,
"r_x2": 545.1,
"r_y2": 463.0,
"r_x3": 308.9,
"r_y3": 463.0,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 483.9,
"r_x1": 545.1,
"r_y1": 483.9,
"r_x2": 545.1,
"r_y2": 475.0,
"r_x3": 308.9,
"r_y3": 475.0,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 495.9,
"r_x1": 545.1,
"r_y1": 495.9,
"r_x2": 545.1,
"r_y2": 486.9,
"r_x3": 308.9,
"r_y3": 486.9,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 507.8,
"r_x1": 545.1,
"r_y1": 507.8,
"r_x2": 545.1,
"r_y2": 498.9,
"r_x3": 308.9,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 519.8,
"r_x1": 545.1,
"r_y1": 519.8,
"r_x2": 545.1,
"r_y2": 510.9,
"r_x3": 308.9,
"r_y3": 510.9,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 531.7,
"r_x1": 545.1,
"r_y1": 531.7,
"r_x2": 545.1,
"r_y2": 522.8,
"r_x3": 308.9,
"r_y3": 522.8,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 543.7,
"r_x1": 545.1,
"r_y1": 543.7,
"r_x2": 545.1,
"r_y2": 534.8,
"r_x3": 308.9,
"r_y3": 534.8,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 555.6,
"r_x1": 545.1,
"r_y1": 555.6,
"r_x2": 545.1,
"r_y2": 546.7,
"r_x3": 308.9,
"r_y3": 546.7,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.6,
"r_x1": 545.1,
"r_y1": 567.6,
"r_x2": 545.1,
"r_y2": 558.7,
"r_x3": 308.9,
"r_y3": 558.7,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 579.5,
"r_x1": 545.1,
"r_y1": 579.5,
"r_x2": 545.1,
"r_y2": 570.6,
"r_x3": 308.9,
"r_y3": 570.6,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 591.5,
"r_x1": 545.1,
"r_y1": 591.5,
"r_x2": 545.1,
"r_y2": 582.6,
"r_x3": 308.9,
"r_y3": 582.6,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 603.5,
"r_x1": 545.1,
"r_y1": 603.5,
"r_x2": 545.1,
"r_y2": 594.5,
"r_x3": 308.9,
"r_y3": 594.5,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 615.4,
"r_x1": 545.1,
"r_y1": 615.4,
"r_x2": 545.1,
"r_y2": 606.5,
"r_x3": 308.9,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 627.4,
"r_x1": 348.2,
"r_y1": 627.4,
"r_x2": 348.2,
"r_y2": 618.5,
"r_x3": 308.9,
"r_y3": 618.5,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."
},
{
"label": "text",
"id": 4,
"page_no": 2,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 632.5,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 320.8,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 308.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"
},
{
"label": "page_footer",
"id": 11,
"page_no": 2,
"cluster": {
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3"
}
],
"body": [
{
"label": "text",
"id": 10,
"page_no": 2,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 250.2,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 250.2,
"r_y1": 84.1,
"r_x2": 250.2,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tag-decoder which is constrained to the table-tags.",
"orig": "tag-decoder which is constrained to the table-tags.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tag-decoder which is constrained to the table-tags."
},
{
"label": "text",
"id": 5,
"page_no": 2,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 275.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 70.4,
"r_y1": 96.1,
"r_x2": 70.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 96.1,
"r_x1": 111.0,
"r_y1": 96.1,
"r_x2": 111.0,
"r_y2": 87.2,
"r_x3": 76.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "practice,",
"orig": "practice,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.5,
"r_y0": 96.1,
"r_x1": 136.3,
"r_y1": 96.1,
"r_x2": 136.3,
"r_y2": 87.2,
"r_x3": 118.5,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "both",
"orig": "both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 142.8,
"r_y0": 96.1,
"r_x1": 175.4,
"r_y1": 96.1,
"r_x2": 175.4,
"r_y2": 87.2,
"r_x3": 142.8,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "network",
"orig": "network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.9,
"r_y0": 96.1,
"r_x1": 232.8,
"r_y1": 96.1,
"r_x2": 232.8,
"r_y2": 87.2,
"r_x3": 181.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "architectures",
"orig": "architectures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.4,
"r_y0": 96.1,
"r_x1": 265.4,
"r_y1": 96.1,
"r_x2": 265.4,
"r_y2": 87.2,
"r_x3": 239.4,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "(IETD",
"orig": "(IETD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 272.0,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 272.0,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.1,
"r_x1": 286.4,
"r_y1": 108.1,
"r_x2": 286.4,
"r_y2": 99.2,
"r_x3": 50.1,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "IEDD) require an implicit, custom trained object-character-",
"orig": "IEDD) require an implicit, custom trained object-character-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "recognition (OCR) to obtain the content of the table-cells.",
"orig": "recognition (OCR) to obtain the content of the table-cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 132.0,
"r_x1": 286.4,
"r_y1": 132.0,
"r_x2": 286.4,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "In the case of IETD, this OCR engine is implicit in the de-",
"orig": "In the case of IETD, this OCR engine is implicit in the de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"orig": "coder similar to [24]. For the IEDD, the OCR is solely em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.9,
"r_x1": 286.4,
"r_y1": 155.9,
"r_x2": 286.4,
"r_y2": 147.0,
"r_x3": 50.1,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "bedded in the content-decoder. This reliance on a custom,",
"orig": "bedded in the content-decoder. This reliance on a custom,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 167.9,
"r_x1": 286.4,
"r_y1": 167.9,
"r_x2": 286.4,
"r_y2": 159.0,
"r_x3": 50.1,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "implicit OCR decoder is of course problematic. OCR is a",
"orig": "implicit OCR decoder is of course problematic. OCR is a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 179.8,
"r_x1": 286.4,
"r_y1": 179.8,
"r_x2": 286.4,
"r_y2": 170.9,
"r_x3": 50.1,
"r_y3": 170.9,
"coord_origin": "TOPLEFT"
},
"text": "well known and extremely tough problem, that often needs",
"orig": "well known and extremely tough problem, that often needs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 191.8,
"r_x1": 286.4,
"r_y1": 191.8,
"r_x2": 286.4,
"r_y2": 182.9,
"r_x3": 50.1,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "custom training for each individual language. However, the",
"orig": "custom training for each individual language. However, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 203.7,
"r_x1": 286.4,
"r_y1": 203.7,
"r_x2": 286.4,
"r_y2": 194.8,
"r_x3": 50.1,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "limited availability for non-english content in the current",
"orig": "limited availability for non-english content in the current",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 215.7,
"r_x1": 286.4,
"r_y1": 215.7,
"r_x2": 286.4,
"r_y2": 206.8,
"r_x3": 50.1,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "datasets, makes it impractical to apply the IETD and IEDD",
"orig": "datasets, makes it impractical to apply the IETD and IEDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 227.6,
"r_x1": 286.4,
"r_y1": 227.6,
"r_x2": 286.4,
"r_y2": 218.7,
"r_x3": 50.1,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "methods on tables with other languages. Additionally, OCR",
"orig": "methods on tables with other languages. Additionally, OCR",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 239.6,
"r_x1": 286.4,
"r_y1": 239.6,
"r_x2": 286.4,
"r_y2": 230.7,
"r_x3": 50.1,
"r_y3": 230.7,
"coord_origin": "TOPLEFT"
},
"text": "can be completely omitted if the tables originate from pro-",
"orig": "can be completely omitted if the tables originate from pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 251.5,
"r_x1": 286.4,
"r_y1": 251.5,
"r_x2": 286.4,
"r_y2": 242.6,
"r_x3": 50.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "grammatic PDF documents with known positions of each",
"orig": "grammatic PDF documents with known positions of each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 263.5,
"r_x1": 286.4,
"r_y1": 263.5,
"r_x2": 286.4,
"r_y2": 254.6,
"r_x3": 50.1,
"r_y3": 254.6,
"coord_origin": "TOPLEFT"
},
"text": "cell. The latter was the inspiration for the work of this pa-",
"orig": "cell. The latter was the inspiration for the work of this pa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 275.5,
"r_x1": 64.8,
"r_y1": 275.5,
"r_x2": 64.8,
"r_y2": 266.5,
"r_x3": 50.1,
"r_y3": 266.5,
"coord_origin": "TOPLEFT"
},
"text": "per.",
"orig": "per.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-character-recognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."
},
{
"label": "text",
"id": 0,
"page_no": 2,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 278.4,
"r": 286.4,
"b": 490.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 287.4,
"r_x1": 171.6,
"r_y1": 287.4,
"r_x2": 171.6,
"r_y2": 278.4,
"r_x3": 62.1,
"r_y3": 278.4,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.6,
"r_y0": 287.5,
"r_x1": 174.3,
"r_y1": 287.5,
"r_x2": 174.3,
"r_y2": 278.6,
"r_x3": 171.6,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": ":",
"orig": ":",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.2,
"r_y0": 287.5,
"r_x1": 286.4,
"r_y1": 287.5,
"r_x2": 286.4,
"r_y2": 278.6,
"r_x3": 185.2,
"r_y3": 278.6,
"coord_origin": "TOPLEFT"
},
"text": "Graph Neural networks",
"orig": "Graph Neural networks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 299.4,
"r_x1": 286.4,
"r_y1": 299.4,
"r_x2": 286.4,
"r_y2": 290.5,
"r_x3": 50.1,
"r_y3": 290.5,
"coord_origin": "TOPLEFT"
},
"text": "(GNN\u2019s) take a radically different approach to table-",
"orig": "(GNN\u2019s) take a radically different approach to table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 311.4,
"r_x1": 131.2,
"r_y1": 311.4,
"r_x2": 131.2,
"r_y2": 302.5,
"r_x3": 50.1,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "structure extraction.",
"orig": "structure extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 311.4,
"r_x1": 286.4,
"r_y1": 311.4,
"r_x2": 286.4,
"r_y2": 302.5,
"r_x3": 138.8,
"r_y3": 302.5,
"coord_origin": "TOPLEFT"
},
"text": "Note that one table cell can consti-",
"orig": "Note that one table cell can consti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 323.3,
"r_x1": 286.4,
"r_y1": 323.3,
"r_x2": 286.4,
"r_y2": 314.4,
"r_x3": 50.1,
"r_y3": 314.4,
"coord_origin": "TOPLEFT"
},
"text": "tute out of multiple text-cells. To obtain the table-structure,",
"orig": "tute out of multiple text-cells. To obtain the table-structure,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.3,
"r_x1": 286.4,
"r_y1": 335.3,
"r_x2": 286.4,
"r_y2": 326.4,
"r_x3": 50.1,
"r_y3": 326.4,
"coord_origin": "TOPLEFT"
},
"text": "one creates an initial graph, where each of the text-cells",
"orig": "one creates an initial graph, where each of the text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.2,
"r_x1": 286.4,
"r_y1": 347.2,
"r_x2": 286.4,
"r_y2": 338.3,
"r_x3": 50.1,
"r_y3": 338.3,
"coord_origin": "TOPLEFT"
},
"text": "becomes a node in the graph similar to [33, 34, 2]. Each",
"orig": "becomes a node in the graph similar to [33, 34, 2]. Each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.2,
"r_x1": 286.4,
"r_y1": 359.2,
"r_x2": 286.4,
"r_y2": 350.3,
"r_x3": 50.1,
"r_y3": 350.3,
"coord_origin": "TOPLEFT"
},
"text": "node is then associated with en embedding vector coming",
"orig": "node is then associated with en embedding vector coming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.2,
"r_x1": 286.4,
"r_y1": 371.2,
"r_x2": 286.4,
"r_y2": 362.2,
"r_x3": 50.1,
"r_y3": 362.2,
"coord_origin": "TOPLEFT"
},
"text": "from the encoded image, its coordinates and the encoded",
"orig": "from the encoded image, its coordinates and the encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.1,
"r_x1": 286.4,
"r_y1": 383.1,
"r_x2": 286.4,
"r_y2": 374.2,
"r_x3": 50.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "text. Furthermore, nodes that represent adjacent text-cells",
"orig": "text. Furthermore, nodes that represent adjacent text-cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.1,
"r_x1": 286.4,
"r_y1": 395.1,
"r_x2": 286.4,
"r_y2": 386.2,
"r_x3": 50.1,
"r_y3": 386.2,
"coord_origin": "TOPLEFT"
},
"text": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"orig": "are linked. Graph Convolutional Networks (GCN\u2019s) based",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 407.0,
"r_x1": 286.4,
"r_y1": 407.0,
"r_x2": 286.4,
"r_y2": 398.1,
"r_x3": 50.1,
"r_y3": 398.1,
"coord_origin": "TOPLEFT"
},
"text": "methods take the image as an input, but also the position of",
"orig": "methods take the image as an input, but also the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.0,
"r_x1": 286.4,
"r_y1": 419.0,
"r_x2": 286.4,
"r_y2": 410.1,
"r_x3": 50.1,
"r_y3": 410.1,
"coord_origin": "TOPLEFT"
},
"text": "the text-cells and their content [18]. The purpose of a GCN",
"orig": "the text-cells and their content [18]. The purpose of a GCN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 430.9,
"r_x1": 286.4,
"r_y1": 430.9,
"r_x2": 286.4,
"r_y2": 422.0,
"r_x3": 50.1,
"r_y3": 422.0,
"coord_origin": "TOPLEFT"
},
"text": "is to transform the input graph into a new graph, which re-",
"orig": "is to transform the input graph into a new graph, which re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 442.9,
"r_x1": 198.2,
"r_y1": 442.9,
"r_x2": 198.2,
"r_y2": 434.0,
"r_x3": 50.1,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "places the old links with new ones.",
"orig": "places the old links with new ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.9,
"r_y0": 442.9,
"r_x1": 286.4,
"r_y1": 442.9,
"r_x2": 286.4,
"r_y2": 434.0,
"r_x3": 205.9,
"r_y3": 434.0,
"coord_origin": "TOPLEFT"
},
"text": "The new links then",
"orig": "The new links then",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 454.8,
"r_x1": 286.4,
"r_y1": 454.8,
"r_x2": 286.4,
"r_y2": 445.9,
"r_x3": 50.1,
"r_y3": 445.9,
"coord_origin": "TOPLEFT"
},
"text": "represent the table-structure. With this approach, one can",
"orig": "represent the table-structure. With this approach, one can",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 466.8,
"r_x1": 286.4,
"r_y1": 466.8,
"r_x2": 286.4,
"r_y2": 457.9,
"r_x3": 50.1,
"r_y3": 457.9,
"coord_origin": "TOPLEFT"
},
"text": "avoid the need to build custom OCR decoders. However,",
"orig": "avoid the need to build custom OCR decoders. However,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 478.7,
"r_x1": 286.4,
"r_y1": 478.7,
"r_x2": 286.4,
"r_y2": 469.8,
"r_x3": 50.1,
"r_y3": 469.8,
"coord_origin": "TOPLEFT"
},
"text": "the quality of the reconstructed structure is not comparable",
"orig": "the quality of the reconstructed structure is not comparable",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 490.7,
"r_x1": 186.5,
"r_y1": 490.7,
"r_x2": 186.5,
"r_y2": 481.8,
"r_x3": 50.1,
"r_y3": 481.8,
"coord_origin": "TOPLEFT"
},
"text": "to the current state-of-the-art [18].",
"orig": "to the current state-of-the-art [18].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to table-structure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."
},
{
"label": "text",
"id": 1,
"page_no": 2,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 493.7,
"r": 286.4,
"b": 622.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 502.6,
"r_x1": 252.9,
"r_y1": 502.6,
"r_x2": 252.9,
"r_y2": 493.7,
"r_x3": 62.1,
"r_y3": 493.7,
"coord_origin": "TOPLEFT"
},
"text": "Hybrid Deep Learning-Rule-Based approach",
"orig": "Hybrid Deep Learning-Rule-Based approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 252.9,
"r_y0": 502.7,
"r_x1": 286.4,
"r_y1": 502.7,
"r_x2": 286.4,
"r_y2": 493.8,
"r_x3": 252.9,
"r_y3": 493.8,
"coord_origin": "TOPLEFT"
},
"text": ": A pop-",
"orig": ": A pop-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.7,
"r_x1": 286.4,
"r_y1": 514.7,
"r_x2": 286.4,
"r_y2": 505.8,
"r_x3": 50.1,
"r_y3": 505.8,
"coord_origin": "TOPLEFT"
},
"text": "ular current model for table-structure identification is the",
"orig": "ular current model for table-structure identification is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 526.6,
"r_x1": 286.4,
"r_y1": 526.6,
"r_x2": 286.4,
"r_y2": 517.7,
"r_x3": 50.1,
"r_y3": 517.7,
"coord_origin": "TOPLEFT"
},
"text": "use of a hybrid Deep Learning-Rule-Based approach similar",
"orig": "use of a hybrid Deep Learning-Rule-Based approach similar",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 538.6,
"r_x1": 286.4,
"r_y1": 538.6,
"r_x2": 286.4,
"r_y2": 529.7,
"r_x3": 50.1,
"r_y3": 529.7,
"coord_origin": "TOPLEFT"
},
"text": "to [27, 29]. In this approach, one first detects the position of",
"orig": "to [27, 29]. In this approach, one first detects the position of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 550.5,
"r_x1": 286.4,
"r_y1": 550.5,
"r_x2": 286.4,
"r_y2": 541.6,
"r_x3": 50.1,
"r_y3": 541.6,
"coord_origin": "TOPLEFT"
},
"text": "the table-cells with object detection (e.g. YoloVx or Mask-",
"orig": "the table-cells with object detection (e.g. YoloVx or Mask-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 562.5,
"r_x1": 286.4,
"r_y1": 562.5,
"r_x2": 286.4,
"r_y2": 553.6,
"r_x3": 50.1,
"r_y3": 553.6,
"coord_origin": "TOPLEFT"
},
"text": "RCNN), then classifies the table into different types (from",
"orig": "RCNN), then classifies the table into different types (from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 574.4,
"r_x1": 286.4,
"r_y1": 574.4,
"r_x2": 286.4,
"r_y2": 565.5,
"r_x3": 50.1,
"r_y3": 565.5,
"coord_origin": "TOPLEFT"
},
"text": "its images) and finally uses different rule-sets to obtain",
"orig": "its images) and finally uses different rule-sets to obtain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.4,
"r_x1": 286.4,
"r_y1": 586.4,
"r_x2": 286.4,
"r_y2": 577.5,
"r_x3": 50.1,
"r_y3": 577.5,
"coord_origin": "TOPLEFT"
},
"text": "its table-structure. Currently, this approach achieves state-",
"orig": "its table-structure. Currently, this approach achieves state-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 598.4,
"r_x1": 286.4,
"r_y1": 598.4,
"r_x2": 286.4,
"r_y2": 589.4,
"r_x3": 50.1,
"r_y3": 589.4,
"coord_origin": "TOPLEFT"
},
"text": "of-the-art results, but is not an end-to-end deep-learning",
"orig": "of-the-art results, but is not an end-to-end deep-learning",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 610.3,
"r_x1": 286.4,
"r_y1": 610.3,
"r_x2": 286.4,
"r_y2": 601.4,
"r_x3": 50.1,
"r_y3": 601.4,
"coord_origin": "TOPLEFT"
},
"text": "method. As such, new rules need to be written if different",
"orig": "method. As such, new rules need to be written if different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 622.3,
"r_x1": 176.0,
"r_y1": 622.3,
"r_x2": 176.0,
"r_y2": 613.4,
"r_x3": 50.1,
"r_y3": 613.4,
"coord_origin": "TOPLEFT"
},
"text": "types of tables are encountered.",
"orig": "types of tables are encountered.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Hybrid Deep Learning-Rule-Based approach : A popular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or Mask-RCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves state-of-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."
},
{
"label": "section_header",
"id": 8,
"page_no": 2,
"cluster": {
"id": 8,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 635.9,
"r": 105.2,
"b": 646.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.7,
"r_x1": 57.8,
"r_y1": 646.7,
"r_x2": 57.8,
"r_y2": 635.9,
"r_x3": 50.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.1,
"r_y0": 646.7,
"r_x1": 105.2,
"r_y1": 646.7,
"r_x2": 105.2,
"r_y2": 635.9,
"r_x3": 68.1,
"r_y3": 635.9,
"coord_origin": "TOPLEFT"
},
"text": "Datasets",
"orig": "Datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Datasets"
},
{
"label": "text",
"id": 3,
"page_no": 2,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 656.4,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 62.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "We rely on large-scale datasets such as PubTabNet [37],",
"orig": "We rely on large-scale datasets such as PubTabNet [37],",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet [36], and TableBank [17] datasets to train and",
"orig": "FinTabNet [36], and TableBank [17] datasets to train and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "evaluate our models. These datasets span over various ap-",
"orig": "evaluate our models. These datasets span over various ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 166.2,
"r_y1": 701.2,
"r_x2": 166.2,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "pearance styles and content.",
"orig": "pearance styles and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 173.7,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 173.7,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "We also introduce our own",
"orig": "We also introduce our own",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "synthetically generated SynthTabNet dataset to fix an im-",
"orig": "synthetically generated SynthTabNet dataset to fix an im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"
},
{
"label": "picture",
"id": 6,
"page_no": 2,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 312.1,
"t": 78.4,
"r": 550.4,
"b": 250.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 380.8,
"t": 79.8,
"r": 486.8,
"b": 88.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.8,
"r_y0": 88.6,
"r_x1": 486.8,
"r_y1": 88.6,
"r_x2": 486.8,
"r_y2": 79.8,
"r_x3": 380.8,
"r_y3": 79.8,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet + FinTabNet",
"orig": "PubTabNet + FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 396.8,
"t": 242.0,
"r": 469.8,
"b": 250.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.8,
"r_y0": 250.8,
"r_x1": 469.8,
"r_y1": 250.8,
"r_x2": 469.8,
"r_y2": 242.0,
"r_x3": 396.8,
"r_y3": 242.0,
"coord_origin": "TOPLEFT"
},
"text": "Rows / Columns",
"orig": "Rows / Columns",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "text",
"bbox": {
"l": 321.0,
"t": 233.4,
"r": 324.8,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 321.0,
"r_y0": 239.3,
"r_x1": 324.8,
"r_y1": 239.3,
"r_x2": 324.8,
"r_y2": 233.4,
"r_x3": 321.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 410.5,
"t": 233.4,
"r": 418.1,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.5,
"r_y0": 239.3,
"r_x1": 418.1,
"r_y1": 239.3,
"r_x2": 418.1,
"r_y2": 233.4,
"r_x3": 410.5,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 500.8,
"t": 233.4,
"r": 508.5,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 500.8,
"r_y0": 239.3,
"r_x1": 508.5,
"r_y1": 239.3,
"r_x2": 508.5,
"r_y2": 233.4,
"r_x3": 500.8,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 365.3,
"t": 233.4,
"r": 372.9,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.3,
"r_y0": 239.3,
"r_x1": 372.9,
"r_y1": 239.3,
"r_x2": 372.9,
"r_y2": 233.4,
"r_x3": 365.3,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 455.7,
"t": 233.4,
"r": 463.3,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.7,
"r_y0": 239.3,
"r_x1": 463.3,
"r_y1": 239.3,
"r_x2": 463.3,
"r_y2": 233.4,
"r_x3": 455.7,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 542.0,
"t": 233.4,
"r": 549.7,
"b": 239.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 542.0,
"r_y0": 239.3,
"r_x1": 549.7,
"r_y1": 239.3,
"r_x2": 549.7,
"r_y2": 233.4,
"r_x3": 542.0,
"r_y3": 233.4,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 316.0,
"t": 230.4,
"r": 319.9,
"b": 236.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 236.3,
"r_x1": 319.9,
"r_y1": 236.3,
"r_x2": 319.9,
"r_y2": 230.4,
"r_x3": 316.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 312.6,
"t": 198.7,
"r": 316.4,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.6,
"r_y0": 204.5,
"r_x1": 316.4,
"r_y1": 204.5,
"r_x2": 316.4,
"r_y2": 198.7,
"r_x3": 312.6,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 316.4,
"t": 198.7,
"r": 320.3,
"b": 204.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.4,
"r_y0": 204.5,
"r_x1": 320.3,
"r_y1": 204.5,
"r_x2": 320.3,
"r_y2": 198.7,
"r_x3": 316.4,
"r_y3": 198.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 313.1,
"t": 168.1,
"r": 317.0,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 173.9,
"r_x1": 317.0,
"r_y1": 173.9,
"r_x2": 317.0,
"r_y2": 168.1,
"r_x3": 313.1,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 317.0,
"t": 168.1,
"r": 320.8,
"b": 173.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.0,
"r_y0": 173.9,
"r_x1": 320.8,
"r_y1": 173.9,
"r_x2": 320.8,
"r_y2": 168.1,
"r_x3": 317.0,
"r_y3": 168.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 312.9,
"t": 136.6,
"r": 316.7,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.9,
"r_y0": 142.4,
"r_x1": 316.7,
"r_y1": 142.4,
"r_x2": 316.7,
"r_y2": 136.6,
"r_x3": 312.9,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 316.7,
"t": 136.6,
"r": 320.6,
"b": 142.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 142.4,
"r_x1": 320.6,
"r_y1": 142.4,
"r_x2": 320.6,
"r_y2": 136.6,
"r_x3": 316.7,
"r_y3": 136.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 312.5,
"t": 105.6,
"r": 316.3,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 111.4,
"r_x1": 316.3,
"r_y1": 111.4,
"r_x2": 316.3,
"r_y2": 105.6,
"r_x3": 312.5,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 316.3,
"t": 105.6,
"r": 320.1,
"b": 111.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 111.4,
"r_x1": 320.1,
"r_y1": 111.4,
"r_x2": 320.1,
"r_y2": 105.6,
"r_x3": 316.3,
"r_y3": 105.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 312.5,
"t": 212.3,
"r": 316.3,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.5,
"r_y0": 218.1,
"r_x1": 316.3,
"r_y1": 218.1,
"r_x2": 316.3,
"r_y2": 212.3,
"r_x3": 312.5,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 316.3,
"t": 212.3,
"r": 320.1,
"b": 218.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.3,
"r_y0": 218.1,
"r_x1": 320.1,
"r_y1": 218.1,
"r_x2": 320.1,
"r_y2": 212.3,
"r_x3": 316.3,
"r_y3": 212.3,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 313.1,
"t": 183.7,
"r": 316.9,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.1,
"r_y0": 189.6,
"r_x1": 316.9,
"r_y1": 189.6,
"r_x2": 316.9,
"r_y2": 183.7,
"r_x3": 313.1,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 316.9,
"t": 183.7,
"r": 320.7,
"b": 189.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.9,
"r_y0": 189.6,
"r_x1": 320.7,
"r_y1": 189.6,
"r_x2": 320.7,
"r_y2": 183.7,
"r_x3": 316.9,
"r_y3": 183.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 312.8,
"t": 152.5,
"r": 316.6,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 158.3,
"r_x1": 316.6,
"r_y1": 158.3,
"r_x2": 316.6,
"r_y2": 152.5,
"r_x3": 312.8,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 316.6,
"t": 152.5,
"r": 320.4,
"b": 158.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 158.3,
"r_x1": 320.4,
"r_y1": 158.3,
"r_x2": 320.4,
"r_y2": 152.5,
"r_x3": 316.6,
"r_y3": 152.5,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 312.2,
"t": 120.6,
"r": 316.0,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.2,
"r_y0": 126.4,
"r_x1": 316.0,
"r_y1": 126.4,
"r_x2": 316.0,
"r_y2": 120.6,
"r_x3": 312.2,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 316.0,
"t": 120.6,
"r": 319.8,
"b": 126.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.0,
"r_y0": 126.4,
"r_x1": 319.8,
"r_y1": 126.4,
"r_x2": 319.8,
"r_y2": 120.6,
"r_x3": 316.0,
"r_y3": 120.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 312.8,
"t": 90.1,
"r": 316.6,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.8,
"r_y0": 95.9,
"r_x1": 316.6,
"r_y1": 95.9,
"r_x2": 316.6,
"r_y2": 90.1,
"r_x3": 312.8,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 316.6,
"t": 90.1,
"r": 320.4,
"b": 95.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.6,
"r_y0": 95.9,
"r_x1": 320.4,
"r_y1": 95.9,
"r_x2": 320.4,
"r_y2": 90.1,
"r_x3": 316.6,
"r_y3": 90.1,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 532.2,
"t": 222.7,
"r": 536.9,
"b": 230.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.2,
"r_y0": 230.0,
"r_x1": 536.9,
"r_y1": 230.0,
"r_x2": 536.9,
"r_y2": 222.7,
"r_x3": 532.2,
"r_y3": 222.7,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 532.9,
"t": 108.3,
"r": 547.6,
"b": 115.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 115.6,
"r_x1": 547.6,
"r_y1": 115.6,
"r_x2": 547.6,
"r_y2": 108.3,
"r_x3": 532.9,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 532.8,
"t": 130.8,
"r": 542.7,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 138.1,
"r_x1": 542.7,
"r_y1": 138.1,
"r_x2": 542.7,
"r_y2": 130.8,
"r_x3": 532.8,
"r_y3": 130.8,
"coord_origin": "TOPLEFT"
},
"text": "8K",
"orig": "8K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 532.8,
"t": 153.9,
"r": 542.8,
"b": 161.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.8,
"r_y0": 161.2,
"r_x1": 542.8,
"r_y1": 161.2,
"r_x2": 542.8,
"r_y2": 153.9,
"r_x3": 532.8,
"r_y3": 153.9,
"coord_origin": "TOPLEFT"
},
"text": "6K",
"orig": "6K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 532.6,
"t": 176.8,
"r": 542.5,
"b": 184.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.6,
"r_y0": 184.0,
"r_x1": 542.5,
"r_y1": 184.0,
"r_x2": 542.5,
"r_y2": 176.8,
"r_x3": 532.6,
"r_y3": 176.8,
"coord_origin": "TOPLEFT"
},
"text": "4K",
"orig": "4K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 532.1,
"t": 199.6,
"r": 542.1,
"b": 206.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.1,
"r_y0": 206.9,
"r_x1": 542.1,
"r_y1": 206.9,
"r_x2": 542.1,
"r_y2": 199.6,
"r_x3": 532.1,
"r_y3": 199.6,
"coord_origin": "TOPLEFT"
},
"text": "2K",
"orig": "2K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 7,
"page_no": 2,
"cluster": {
"id": 7,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 267.8,
"r": 545.1,
"b": 288.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 276.7,
"r_x1": 346.1,
"r_y1": 276.7,
"r_x2": 346.1,
"r_y2": 267.8,
"r_x3": 308.9,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 2:",
"orig": "Figure 2:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.5,
"r_y0": 276.7,
"r_x1": 545.1,
"r_y1": 276.7,
"r_x2": 545.1,
"r_y2": 267.8,
"r_x3": 354.5,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "Distribution of the tables across different table",
"orig": "Distribution of the tables across different table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 288.7,
"r_x1": 498.6,
"r_y1": 288.7,
"r_x2": 498.6,
"r_y2": 279.8,
"r_x3": 308.9,
"r_y3": 279.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions in PubTabNet + FinTabNet datasets",
"orig": "dimensions in PubTabNet + FinTabNet datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"
},
{
"label": "text",
"id": 9,
"page_no": 2,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 317.5,
"r": 437.3,
"b": 326.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 326.4,
"r_x1": 437.3,
"r_y1": 326.4,
"r_x2": 437.3,
"r_y2": 317.5,
"r_x3": 308.9,
"r_y3": 317.5,
"coord_origin": "TOPLEFT"
},
"text": "balance in the previous datasets.",
"orig": "balance in the previous datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "balance in the previous datasets."
},
{
"label": "text",
"id": 2,
"page_no": 2,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 331.5,
"r": 545.1,
"b": 627.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 340.4,
"r_x1": 545.1,
"r_y1": 340.4,
"r_x2": 545.1,
"r_y2": 331.5,
"r_x3": 320.8,
"r_y3": 331.5,
"coord_origin": "TOPLEFT"
},
"text": "The PubTabNet dataset contains 509k tables delivered as",
"orig": "The PubTabNet dataset contains 509k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.4,
"r_x1": 545.1,
"r_y1": 352.4,
"r_x2": 545.1,
"r_y2": 343.5,
"r_x3": 308.9,
"r_y3": 343.5,
"coord_origin": "TOPLEFT"
},
"text": "annotated PNG images. The annotations consist of the table",
"orig": "annotated PNG images. The annotations consist of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.3,
"r_x1": 545.1,
"r_y1": 364.3,
"r_x2": 545.1,
"r_y2": 355.4,
"r_x3": 308.9,
"r_y3": 355.4,
"coord_origin": "TOPLEFT"
},
"text": "structure represented in HTML format, the tokenized text",
"orig": "structure represented in HTML format, the tokenized text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.3,
"r_x1": 545.1,
"r_y1": 376.3,
"r_x2": 545.1,
"r_y2": 367.4,
"r_x3": 308.9,
"r_y3": 367.4,
"coord_origin": "TOPLEFT"
},
"text": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.3,
"r_x1": 545.1,
"r_y1": 388.3,
"r_x2": 545.1,
"r_y2": 379.4,
"r_x3": 308.9,
"r_y3": 379.4,
"coord_origin": "TOPLEFT"
},
"text": "pearance style of PubTabNet. Depending on its complexity,",
"orig": "pearance style of PubTabNet. Depending on its complexity,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 308.9,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "a table is characterized as \u201csimple\u201d when it does not contain",
"orig": "a table is characterized as \u201csimple\u201d when it does not contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"orig": "row spans or column spans, otherwise it is \u201ccomplex\u201d. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "dataset is divided into Train and Val splits (roughly 98% and",
"orig": "dataset is divided into Train and Val splits (roughly 98% and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "2%). The Train split consists of 54% simple and 46% com-",
"orig": "2%). The Train split consists of 54% simple and 46% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "plex tables and the Val split of 51% and 49% respectively.",
"orig": "plex tables and the Val split of 51% and 49% respectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 545.1,
"r_y1": 460.0,
"r_x2": 545.1,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "The FinTabNet dataset contains 112k tables delivered as",
"orig": "The FinTabNet dataset contains 112k tables delivered as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 471.9,
"r_x1": 545.1,
"r_y1": 471.9,
"r_x2": 545.1,
"r_y2": 463.0,
"r_x3": 308.9,
"r_y3": 463.0,
"coord_origin": "TOPLEFT"
},
"text": "single-page PDF documents with mixed table structures and",
"orig": "single-page PDF documents with mixed table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 483.9,
"r_x1": 545.1,
"r_y1": 483.9,
"r_x2": 545.1,
"r_y2": 475.0,
"r_x3": 308.9,
"r_y3": 475.0,
"coord_origin": "TOPLEFT"
},
"text": "text content. Similarly to the PubTabNet, the annotations",
"orig": "text content. Similarly to the PubTabNet, the annotations",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 495.9,
"r_x1": 545.1,
"r_y1": 495.9,
"r_x2": 545.1,
"r_y2": 486.9,
"r_x3": 308.9,
"r_y3": 486.9,
"coord_origin": "TOPLEFT"
},
"text": "of FinTabNet include the table structure in HTML, the to-",
"orig": "of FinTabNet include the table structure in HTML, the to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 507.8,
"r_x1": 545.1,
"r_y1": 507.8,
"r_x2": 545.1,
"r_y2": 498.9,
"r_x3": 308.9,
"r_y3": 498.9,
"coord_origin": "TOPLEFT"
},
"text": "kenized text and the bounding boxes on a table cell basis.",
"orig": "kenized text and the bounding boxes on a table cell basis.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 519.8,
"r_x1": 545.1,
"r_y1": 519.8,
"r_x2": 545.1,
"r_y2": 510.9,
"r_x3": 308.9,
"r_y3": 510.9,
"coord_origin": "TOPLEFT"
},
"text": "The dataset is divided into Train, Test and Val splits (81%,",
"orig": "The dataset is divided into Train, Test and Val splits (81%,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 531.7,
"r_x1": 545.1,
"r_y1": 531.7,
"r_x2": 545.1,
"r_y2": 522.8,
"r_x3": 308.9,
"r_y3": 522.8,
"coord_origin": "TOPLEFT"
},
"text": "9.5%, 9.5%), and each one is almost equally divided into",
"orig": "9.5%, 9.5%), and each one is almost equally divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 543.7,
"r_x1": 545.1,
"r_y1": 543.7,
"r_x2": 545.1,
"r_y2": 534.8,
"r_x3": 308.9,
"r_y3": 534.8,
"coord_origin": "TOPLEFT"
},
"text": "simple and complex tables (Train: 48% simple, 52% com-",
"orig": "simple and complex tables (Train: 48% simple, 52% com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 555.6,
"r_x1": 545.1,
"r_y1": 555.6,
"r_x2": 545.1,
"r_y2": 546.7,
"r_x3": 308.9,
"r_y3": 546.7,
"coord_origin": "TOPLEFT"
},
"text": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"orig": "plex, Test: 48% simple, 52% complex, Test: 53% simple,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.6,
"r_x1": 545.1,
"r_y1": 567.6,
"r_x2": 545.1,
"r_y2": 558.7,
"r_x3": 308.9,
"r_y3": 558.7,
"coord_origin": "TOPLEFT"
},
"text": "47% complex). Finally the TableBank dataset consists of",
"orig": "47% complex). Finally the TableBank dataset consists of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 579.5,
"r_x1": 545.1,
"r_y1": 579.5,
"r_x2": 545.1,
"r_y2": 570.6,
"r_x3": 308.9,
"r_y3": 570.6,
"coord_origin": "TOPLEFT"
},
"text": "145k tables provided as JPEG images. The latter has anno-",
"orig": "145k tables provided as JPEG images. The latter has anno-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 591.5,
"r_x1": 545.1,
"r_y1": 591.5,
"r_x2": 545.1,
"r_y2": 582.6,
"r_x3": 308.9,
"r_y3": 582.6,
"coord_origin": "TOPLEFT"
},
"text": "tations for the table structure, but only few with bounding",
"orig": "tations for the table structure, but only few with bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 603.5,
"r_x1": 545.1,
"r_y1": 603.5,
"r_x2": 545.1,
"r_y2": 594.5,
"r_x3": 308.9,
"r_y3": 594.5,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the table cells. The entire dataset consists of sim-",
"orig": "boxes of the table cells. The entire dataset consists of sim-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 615.4,
"r_x1": 545.1,
"r_y1": 615.4,
"r_x2": 545.1,
"r_y2": 606.5,
"r_x3": 308.9,
"r_y3": 606.5,
"coord_origin": "TOPLEFT"
},
"text": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"orig": "ple tables and it is divided into 90% Train, 3% Test and 7%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 627.4,
"r_x1": 348.2,
"r_y1": 627.4,
"r_x2": 348.2,
"r_y2": 618.5,
"r_x3": 308.9,
"r_y3": 618.5,
"coord_origin": "TOPLEFT"
},
"text": "Val splits.",
"orig": "Val splits.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The PubTabNet dataset contains 509k tables delivered as annotated PNG images. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as \"simple\" when it does not contain row spans or column spans, otherwise it is \"complex\". The dataset is divided into Train and Val splits (roughly 98% and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDF documents with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."
},
{
"label": "text",
"id": 4,
"page_no": 2,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 632.5,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.5,
"r_x3": 320.8,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "Due to the heterogeneity across the dataset formats, it",
"orig": "Due to the heterogeneity across the dataset formats, it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.4,
"r_x1": 545.1,
"r_y1": 653.4,
"r_x2": 545.1,
"r_y2": 644.5,
"r_x3": 308.9,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "was necessary to combine all available data into one homog-",
"orig": "was necessary to combine all available data into one homog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.3,
"r_x1": 545.1,
"r_y1": 665.3,
"r_x2": 545.1,
"r_y2": 656.4,
"r_x3": 308.9,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "enized dataset before we could train our models for practi-",
"orig": "enized dataset before we could train our models for practi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "cal purposes. Given the size of PubTabNet, we adopted its",
"orig": "cal purposes. Given the size of PubTabNet, we adopted its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "annotation format and we extracted and converted all tables",
"orig": "annotation format and we extracted and converted all tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "as PNG images with a resolution of 72 dpi. Additionally,",
"orig": "as PNG images with a resolution of 72 dpi. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "we have filtered out tables with extreme sizes due to small",
"orig": "we have filtered out tables with extreme sizes due to small",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"
}
],
"headers": [
{
"label": "page_footer",
"id": 11,
"page_no": 2,
"cluster": {
"id": 11,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3"
}
]
}
},
{
"page_no": 3,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 212.3,
"r_y1": 96.1,
"r_x2": 212.3,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 109.9,
"r_x1": 286.4,
"r_y1": 109.9,
"r_x2": 286.4,
"r_y2": 101.0,
"r_x3": 62.1,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 121.8,
"r_x1": 286.4,
"r_y1": 121.8,
"r_x2": 286.4,
"r_y2": 112.9,
"r_x3": 50.1,
"r_y3": 112.9,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 133.8,
"r_x1": 286.4,
"r_y1": 133.8,
"r_x2": 286.4,
"r_y2": 124.9,
"r_x3": 50.1,
"r_y3": 124.9,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 145.7,
"r_x1": 286.4,
"r_y1": 145.7,
"r_x2": 286.4,
"r_y2": 136.8,
"r_x3": 50.1,
"r_y3": 136.8,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 157.7,
"r_x1": 286.4,
"r_y1": 157.7,
"r_x2": 286.4,
"r_y2": 148.8,
"r_x3": 50.1,
"r_y3": 148.8,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 169.6,
"r_x1": 286.4,
"r_y1": 169.6,
"r_x2": 286.4,
"r_y2": 160.7,
"r_x3": 50.1,
"r_y3": 160.7,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 181.6,
"r_x1": 286.4,
"r_y1": 181.6,
"r_x2": 286.4,
"r_y2": 172.7,
"r_x3": 50.1,
"r_y3": 172.7,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 193.6,
"r_x1": 286.4,
"r_y1": 193.6,
"r_x2": 286.4,
"r_y2": 184.6,
"r_x3": 50.1,
"r_y3": 184.6,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 205.5,
"r_x1": 286.4,
"r_y1": 205.5,
"r_x2": 286.4,
"r_y2": 196.6,
"r_x3": 50.1,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 217.5,
"r_x1": 286.4,
"r_y1": 217.5,
"r_x2": 286.4,
"r_y2": 208.6,
"r_x3": 50.1,
"r_y3": 208.6,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 229.4,
"r_x1": 286.4,
"r_y1": 229.4,
"r_x2": 286.4,
"r_y2": 220.5,
"r_x3": 50.1,
"r_y3": 220.5,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 241.4,
"r_x1": 286.4,
"r_y1": 241.4,
"r_x2": 286.4,
"r_y2": 232.5,
"r_x3": 50.1,
"r_y3": 232.5,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 253.3,
"r_x1": 286.4,
"r_y1": 253.3,
"r_x2": 286.4,
"r_y2": 244.4,
"r_x3": 50.1,
"r_y3": 244.4,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 265.3,
"r_x1": 286.4,
"r_y1": 265.3,
"r_x2": 286.4,
"r_y2": 256.4,
"r_x3": 50.1,
"r_y3": 256.4,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 277.2,
"r_x1": 286.4,
"r_y1": 277.2,
"r_x2": 286.4,
"r_y2": 268.3,
"r_x3": 50.1,
"r_y3": 268.3,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 289.2,
"r_x1": 68.7,
"r_y1": 289.2,
"r_x2": 68.7,
"r_y2": 280.3,
"r_x3": 50.1,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.6,
"r_y0": 289.2,
"r_x1": 286.4,
"r_y1": 289.2,
"r_x2": 286.4,
"r_y2": 280.3,
"r_x3": 75.6,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 301.2,
"r_x1": 286.4,
"r_y1": 301.2,
"r_x2": 286.4,
"r_y2": 292.2,
"r_x3": 50.1,
"r_y3": 292.2,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 313.1,
"r_x1": 75.7,
"r_y1": 313.1,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.1,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.0,
"r_x3": 62.1,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 338.9,
"r_x1": 286.4,
"r_y1": 338.9,
"r_x2": 286.4,
"r_y2": 330.0,
"r_x3": 50.1,
"r_y3": 330.0,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 350.8,
"r_x1": 286.4,
"r_y1": 350.8,
"r_x2": 286.4,
"r_y2": 341.9,
"r_x3": 50.1,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 362.8,
"r_x1": 286.4,
"r_y1": 362.8,
"r_x2": 286.4,
"r_y2": 353.9,
"r_x3": 50.1,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 374.7,
"r_x1": 286.4,
"r_y1": 374.7,
"r_x2": 286.4,
"r_y2": 365.8,
"r_x3": 50.1,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 386.7,
"r_x1": 141.6,
"r_y1": 386.7,
"r_x2": 141.6,
"r_y2": 377.8,
"r_x3": 50.1,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.7,
"r_x1": 286.4,
"r_y1": 386.7,
"r_x2": 286.4,
"r_y2": 377.8,
"r_x3": 148.7,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 398.6,
"r_x1": 286.4,
"r_y1": 398.6,
"r_x2": 286.4,
"r_y2": 389.7,
"r_x3": 50.1,
"r_y3": 389.7,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 410.6,
"r_x1": 286.4,
"r_y1": 410.6,
"r_x2": 286.4,
"r_y2": 401.7,
"r_x3": 50.1,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 422.5,
"r_x1": 286.4,
"r_y1": 422.5,
"r_x2": 286.4,
"r_y2": 413.6,
"r_x3": 50.1,
"r_y3": 413.6,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.6,
"r_x3": 50.1,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 448.3,
"r_x1": 286.4,
"r_y1": 448.3,
"r_x2": 286.4,
"r_y2": 439.4,
"r_x3": 62.1,
"r_y3": 439.4,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.3,
"r_x1": 172.1,
"r_y1": 460.3,
"r_x2": 172.1,
"r_y2": 451.3,
"r_x3": 50.1,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.1,
"r_y0": 460.0,
"r_x1": 224.7,
"r_y1": 460.0,
"r_x2": 224.7,
"r_y2": 451.4,
"r_x3": 174.1,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.7,
"r_y0": 460.3,
"r_x1": 286.4,
"r_y1": 460.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 224.7,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.2,
"r_x1": 286.4,
"r_y1": 472.2,
"r_x2": 286.4,
"r_y2": 463.3,
"r_x3": 50.1,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.2,
"r_x1": 286.4,
"r_y1": 484.2,
"r_x2": 286.4,
"r_y2": 475.3,
"r_x3": 50.1,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.1,
"r_x1": 286.4,
"r_y1": 496.1,
"r_x2": 286.4,
"r_y2": 487.2,
"r_x3": 50.1,
"r_y3": 487.2,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 508.1,
"r_x1": 286.4,
"r_y1": 508.1,
"r_x2": 286.4,
"r_y2": 499.2,
"r_x3": 50.1,
"r_y3": 499.2,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 520.0,
"r_x1": 286.4,
"r_y1": 520.0,
"r_x2": 286.4,
"r_y2": 511.1,
"r_x3": 50.1,
"r_y3": 511.1,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 532.0,
"r_x1": 286.4,
"r_y1": 532.0,
"r_x2": 286.4,
"r_y2": 523.1,
"r_x3": 50.1,
"r_y3": 523.1,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.9,
"r_x1": 286.4,
"r_y1": 543.9,
"r_x2": 286.4,
"r_y2": 535.0,
"r_x3": 50.1,
"r_y3": 535.0,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.9,
"r_x1": 286.4,
"r_y1": 555.9,
"r_x2": 286.4,
"r_y2": 547.0,
"r_x3": 50.1,
"r_y3": 547.0,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.8,
"r_x1": 286.4,
"r_y1": 567.8,
"r_x2": 286.4,
"r_y2": 558.9,
"r_x3": 50.1,
"r_y3": 558.9,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.8,
"r_x1": 286.4,
"r_y1": 579.8,
"r_x2": 286.4,
"r_y2": 570.9,
"r_x3": 50.1,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.8,
"r_x1": 286.4,
"r_y1": 591.8,
"r_x2": 286.4,
"r_y2": 582.9,
"r_x3": 50.1,
"r_y3": 582.9,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.7,
"r_x1": 286.4,
"r_y1": 603.7,
"r_x2": 286.4,
"r_y2": 594.8,
"r_x3": 50.1,
"r_y3": 594.8,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.7,
"r_x1": 286.4,
"r_y1": 615.7,
"r_x2": 286.4,
"r_y2": 606.8,
"r_x3": 50.1,
"r_y3": 606.8,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.6,
"r_x1": 209.8,
"r_y1": 627.6,
"r_x2": 209.8,
"r_y2": 618.7,
"r_x3": 50.1,
"r_y3": 618.7,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 62.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 176.6,
"r_x1": 344.6,
"r_y1": 176.6,
"r_x2": 344.6,
"r_y2": 167.7,
"r_x3": 308.9,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.1,
"r_y0": 176.6,
"r_x1": 380.5,
"r_y1": 176.6,
"r_x2": 380.5,
"r_y2": 167.7,
"r_x3": 361.1,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.6,
"r_y0": 176.3,
"r_x1": 468.7,
"r_y1": 176.3,
"r_x2": 468.7,
"r_y2": 167.8,
"r_x3": 386.6,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.6,
"r_x1": 489.2,
"r_y1": 176.6,
"r_x2": 489.2,
"r_y2": 167.7,
"r_x3": 474.8,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.3,
"r_x1": 545.1,
"r_y1": 176.3,
"r_x2": 545.1,
"r_y2": 167.8,
"r_x3": 495.3,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 188.3,
"r_x1": 341.2,
"r_y1": 188.3,
"r_x2": 341.2,
"r_y2": 179.7,
"r_x3": 308.9,
"r_y3": 179.7,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.5,
"r_y0": 188.5,
"r_x1": 545.1,
"r_y1": 188.5,
"r_x2": 545.1,
"r_y2": 179.6,
"r_x3": 343.5,
"r_y3": 179.6,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 200.5,
"r_x1": 545.1,
"r_y1": 200.5,
"r_x2": 545.1,
"r_y2": 191.6,
"r_x3": 308.9,
"r_y3": 191.6,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 212.4,
"r_x1": 545.1,
"r_y1": 212.4,
"r_x2": 545.1,
"r_y2": 203.5,
"r_x3": 308.9,
"r_y3": 203.5,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 224.4,
"r_x1": 523.9,
"r_y1": 224.4,
"r_x2": 523.9,
"r_y2": 215.5,
"r_x3": 308.9,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.5,
"r_x1": 545.1,
"r_y1": 258.5,
"r_x2": 545.1,
"r_y2": 249.6,
"r_x3": 308.9,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.5,
"r_x1": 545.1,
"r_y1": 270.5,
"r_x2": 545.1,
"r_y2": 261.6,
"r_x3": 308.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.4,
"r_x1": 545.1,
"r_y1": 282.4,
"r_x2": 545.1,
"r_y2": 273.5,
"r_x3": 308.9,
"r_y3": 273.5,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.4,
"r_x1": 436.8,
"r_y1": 294.4,
"r_x2": 436.8,
"r_y2": 285.5,
"r_x3": 308.9,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 306.7,
"r_x1": 542.7,
"r_y1": 306.7,
"r_x2": 542.7,
"r_y2": 297.8,
"r_x3": 320.8,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 331.9,
"r_x1": 316.3,
"r_y1": 331.9,
"r_x2": 316.3,
"r_y2": 321.2,
"r_x3": 308.9,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.2,
"r_y0": 331.9,
"r_x1": 444.9,
"r_y1": 331.9,
"r_x2": 444.9,
"r_y2": 321.2,
"r_x3": 326.2,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 350.8,
"r_x1": 545.1,
"r_y1": 350.8,
"r_x2": 545.1,
"r_y2": 341.9,
"r_x3": 320.8,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 362.8,
"r_x1": 545.1,
"r_y1": 362.8,
"r_x2": 545.1,
"r_y2": 353.9,
"r_x3": 308.9,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 374.8,
"r_x1": 545.1,
"r_y1": 374.8,
"r_x2": 545.1,
"r_y2": 365.8,
"r_x3": 308.9,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 386.7,
"r_x1": 545.1,
"r_y1": 386.7,
"r_x2": 545.1,
"r_y2": 377.8,
"r_x3": 308.9,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 398.7,
"r_x1": 545.1,
"r_y1": 398.7,
"r_x2": 545.1,
"r_y2": 389.8,
"r_x3": 308.9,
"r_y3": 389.8,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 410.6,
"r_x1": 545.1,
"r_y1": 410.6,
"r_x2": 545.1,
"r_y2": 401.7,
"r_x3": 308.9,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 422.6,
"r_x1": 545.1,
"r_y1": 422.6,
"r_x2": 545.1,
"r_y2": 413.7,
"r_x3": 308.9,
"r_y3": 413.7,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 434.5,
"r_x1": 545.1,
"r_y1": 434.5,
"r_x2": 545.1,
"r_y2": 425.6,
"r_x3": 308.9,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 446.5,
"r_x1": 437.9,
"r_y1": 446.5,
"r_x2": 437.9,
"r_y2": 437.6,
"r_x3": 308.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 467.5,
"r_x1": 323.1,
"r_y1": 467.5,
"r_x2": 323.1,
"r_y2": 457.7,
"r_x3": 308.9,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.7,
"r_y0": 467.5,
"r_x1": 420.2,
"r_y1": 467.5,
"r_x2": 420.2,
"r_y2": 457.7,
"r_x3": 332.7,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 485.7,
"r_x1": 545.1,
"r_y1": 485.7,
"r_x2": 545.1,
"r_y2": 476.8,
"r_x3": 320.8,
"r_y3": 476.8,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.6,
"r_x1": 509.0,
"r_y1": 497.6,
"r_x2": 509.0,
"r_y2": 488.7,
"r_x3": 308.9,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.6,
"r_y0": 497.6,
"r_x1": 523.1,
"r_y1": 497.6,
"r_x2": 523.1,
"r_y2": 488.7,
"r_x3": 515.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 497.6,
"r_x1": 545.1,
"r_y1": 497.6,
"r_x2": 545.1,
"r_y2": 488.7,
"r_x3": 529.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.4,
"r_x1": 406.3,
"r_y1": 509.4,
"r_x2": 406.3,
"r_y2": 500.8,
"r_x3": 308.9,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.9,
"r_y0": 509.6,
"r_x1": 545.1,
"r_y1": 509.6,
"r_x2": 545.1,
"r_y2": 500.7,
"r_x3": 408.9,
"r_y3": 500.7,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.5,
"r_x1": 409.4,
"r_y1": 521.5,
"r_x2": 409.4,
"r_y2": 512.6,
"r_x3": 308.9,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.7,
"r_y0": 521.5,
"r_x1": 545.1,
"r_y1": 521.5,
"r_x2": 545.1,
"r_y2": 512.6,
"r_x3": 416.7,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.5,
"r_x1": 436.2,
"r_y1": 533.5,
"r_x2": 436.2,
"r_y2": 524.6,
"r_x3": 308.9,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 533.3,
"r_x1": 513.9,
"r_y1": 533.3,
"r_x2": 513.9,
"r_y2": 524.7,
"r_x3": 439.5,
"r_y3": 524.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.4,
"r_y0": 533.5,
"r_x1": 545.1,
"r_y1": 533.5,
"r_x2": 545.1,
"r_y2": 524.6,
"r_x3": 517.4,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.4,
"r_x1": 545.1,
"r_y1": 545.4,
"r_x2": 545.1,
"r_y2": 536.5,
"r_x3": 308.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.4,
"r_x1": 358.5,
"r_y1": 557.4,
"r_x2": 358.5,
"r_y2": 548.5,
"r_x3": 308.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.2,
"r_y0": 557.4,
"r_x1": 545.1,
"r_y1": 557.4,
"r_x2": 545.1,
"r_y2": 548.5,
"r_x3": 365.2,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.4,
"r_x1": 352.4,
"r_y1": 569.4,
"r_x2": 352.4,
"r_y2": 560.5,
"r_x3": 308.9,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.4,
"r_y0": 569.1,
"r_x1": 360.2,
"r_y1": 569.1,
"r_x2": 360.2,
"r_y2": 560.3,
"r_x3": 352.4,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 569.4,
"r_x1": 367.9,
"r_y1": 569.4,
"r_x2": 367.9,
"r_y2": 560.5,
"r_x3": 360.2,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.9,
"r_y0": 569.1,
"r_x1": 375.7,
"r_y1": 569.1,
"r_x2": 375.7,
"r_y2": 560.3,
"r_x3": 367.9,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.7,
"r_y0": 569.4,
"r_x1": 545.1,
"r_y1": 569.4,
"r_x2": 545.1,
"r_y2": 560.5,
"r_x3": 375.7,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.3,
"r_x1": 545.1,
"r_y1": 581.3,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 308.9,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.3,
"r_x1": 483.1,
"r_y1": 593.3,
"r_x2": 483.1,
"r_y2": 584.4,
"r_x3": 308.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 593.0,
"r_x1": 490.9,
"r_y1": 593.0,
"r_x2": 490.9,
"r_y2": 584.2,
"r_x3": 483.1,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.9,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 490.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.2,
"r_x1": 545.1,
"r_y1": 605.2,
"r_x2": 545.1,
"r_y2": 596.3,
"r_x3": 308.9,
"r_y3": 596.3,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 329.6,
"r_y1": 617.2,
"r_x2": 329.6,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.6,
"r_y0": 617.0,
"r_x1": 337.4,
"r_y1": 617.0,
"r_x2": 337.4,
"r_y2": 608.1,
"r_x3": 329.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.4,
"r_y0": 617.2,
"r_x1": 468.6,
"r_y1": 617.2,
"r_x2": 468.6,
"r_y2": 608.3,
"r_x3": 337.4,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 617.0,
"r_x1": 476.3,
"r_y1": 617.0,
"r_x2": 476.3,
"r_y2": 608.1,
"r_x3": 468.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.3,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 476.3,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.1,
"r_x1": 545.1,
"r_y1": 629.1,
"r_x2": 545.1,
"r_y2": 620.2,
"r_x3": 308.9,
"r_y3": 620.2,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.0,
"r_x1": 545.1,
"r_y1": 653.0,
"r_x2": 545.1,
"r_y2": 644.1,
"r_x3": 308.9,
"r_y3": 644.1,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 449.4,
"r_y1": 665.0,
"r_x2": 449.4,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.2,
"r_x1": 431.9,
"r_y1": 677.2,
"r_x2": 431.9,
"r_y2": 668.3,
"r_x3": 320.8,
"r_y3": 668.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 439.5,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 212.3,
"r_y1": 96.1,
"r_x2": 212.3,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 101.0,
"r": 286.4,
"b": 313.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 109.9,
"r_x1": 286.4,
"r_y1": 109.9,
"r_x2": 286.4,
"r_y2": 101.0,
"r_x3": 62.1,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 121.8,
"r_x1": 286.4,
"r_y1": 121.8,
"r_x2": 286.4,
"r_y2": 112.9,
"r_x3": 50.1,
"r_y3": 112.9,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 133.8,
"r_x1": 286.4,
"r_y1": 133.8,
"r_x2": 286.4,
"r_y2": 124.9,
"r_x3": 50.1,
"r_y3": 124.9,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 145.7,
"r_x1": 286.4,
"r_y1": 145.7,
"r_x2": 286.4,
"r_y2": 136.8,
"r_x3": 50.1,
"r_y3": 136.8,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 157.7,
"r_x1": 286.4,
"r_y1": 157.7,
"r_x2": 286.4,
"r_y2": 148.8,
"r_x3": 50.1,
"r_y3": 148.8,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 169.6,
"r_x1": 286.4,
"r_y1": 169.6,
"r_x2": 286.4,
"r_y2": 160.7,
"r_x3": 50.1,
"r_y3": 160.7,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 181.6,
"r_x1": 286.4,
"r_y1": 181.6,
"r_x2": 286.4,
"r_y2": 172.7,
"r_x3": 50.1,
"r_y3": 172.7,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 193.6,
"r_x1": 286.4,
"r_y1": 193.6,
"r_x2": 286.4,
"r_y2": 184.6,
"r_x3": 50.1,
"r_y3": 184.6,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 205.5,
"r_x1": 286.4,
"r_y1": 205.5,
"r_x2": 286.4,
"r_y2": 196.6,
"r_x3": 50.1,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 217.5,
"r_x1": 286.4,
"r_y1": 217.5,
"r_x2": 286.4,
"r_y2": 208.6,
"r_x3": 50.1,
"r_y3": 208.6,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 229.4,
"r_x1": 286.4,
"r_y1": 229.4,
"r_x2": 286.4,
"r_y2": 220.5,
"r_x3": 50.1,
"r_y3": 220.5,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 241.4,
"r_x1": 286.4,
"r_y1": 241.4,
"r_x2": 286.4,
"r_y2": 232.5,
"r_x3": 50.1,
"r_y3": 232.5,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 253.3,
"r_x1": 286.4,
"r_y1": 253.3,
"r_x2": 286.4,
"r_y2": 244.4,
"r_x3": 50.1,
"r_y3": 244.4,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 265.3,
"r_x1": 286.4,
"r_y1": 265.3,
"r_x2": 286.4,
"r_y2": 256.4,
"r_x3": 50.1,
"r_y3": 256.4,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 277.2,
"r_x1": 286.4,
"r_y1": 277.2,
"r_x2": 286.4,
"r_y2": 268.3,
"r_x3": 50.1,
"r_y3": 268.3,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 289.2,
"r_x1": 68.7,
"r_y1": 289.2,
"r_x2": 68.7,
"r_y2": 280.3,
"r_x3": 50.1,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.6,
"r_y0": 289.2,
"r_x1": 286.4,
"r_y1": 289.2,
"r_x2": 286.4,
"r_y2": 280.3,
"r_x3": 75.6,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 301.2,
"r_x1": 286.4,
"r_y1": 301.2,
"r_x2": 286.4,
"r_y2": 292.2,
"r_x3": 50.1,
"r_y3": 292.2,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 313.1,
"r_x1": 75.7,
"r_y1": 313.1,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.1,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 318.0,
"r": 286.4,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.0,
"r_x3": 62.1,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 338.9,
"r_x1": 286.4,
"r_y1": 338.9,
"r_x2": 286.4,
"r_y2": 330.0,
"r_x3": 50.1,
"r_y3": 330.0,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 350.8,
"r_x1": 286.4,
"r_y1": 350.8,
"r_x2": 286.4,
"r_y2": 341.9,
"r_x3": 50.1,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 362.8,
"r_x1": 286.4,
"r_y1": 362.8,
"r_x2": 286.4,
"r_y2": 353.9,
"r_x3": 50.1,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 374.7,
"r_x1": 286.4,
"r_y1": 374.7,
"r_x2": 286.4,
"r_y2": 365.8,
"r_x3": 50.1,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 386.7,
"r_x1": 141.6,
"r_y1": 386.7,
"r_x2": 141.6,
"r_y2": 377.8,
"r_x3": 50.1,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.7,
"r_x1": 286.4,
"r_y1": 386.7,
"r_x2": 286.4,
"r_y2": 377.8,
"r_x3": 148.7,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 398.6,
"r_x1": 286.4,
"r_y1": 398.6,
"r_x2": 286.4,
"r_y2": 389.7,
"r_x3": 50.1,
"r_y3": 389.7,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 410.6,
"r_x1": 286.4,
"r_y1": 410.6,
"r_x2": 286.4,
"r_y2": 401.7,
"r_x3": 50.1,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 422.5,
"r_x1": 286.4,
"r_y1": 422.5,
"r_x2": 286.4,
"r_y2": 413.6,
"r_x3": 50.1,
"r_y3": 413.6,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.6,
"r_x3": 50.1,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 439.4,
"r": 286.4,
"b": 627.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 448.3,
"r_x1": 286.4,
"r_y1": 448.3,
"r_x2": 286.4,
"r_y2": 439.4,
"r_x3": 62.1,
"r_y3": 439.4,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.3,
"r_x1": 172.1,
"r_y1": 460.3,
"r_x2": 172.1,
"r_y2": 451.3,
"r_x3": 50.1,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.1,
"r_y0": 460.0,
"r_x1": 224.7,
"r_y1": 460.0,
"r_x2": 224.7,
"r_y2": 451.4,
"r_x3": 174.1,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.7,
"r_y0": 460.3,
"r_x1": 286.4,
"r_y1": 460.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 224.7,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.2,
"r_x1": 286.4,
"r_y1": 472.2,
"r_x2": 286.4,
"r_y2": 463.3,
"r_x3": 50.1,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.2,
"r_x1": 286.4,
"r_y1": 484.2,
"r_x2": 286.4,
"r_y2": 475.3,
"r_x3": 50.1,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.1,
"r_x1": 286.4,
"r_y1": 496.1,
"r_x2": 286.4,
"r_y2": 487.2,
"r_x3": 50.1,
"r_y3": 487.2,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 508.1,
"r_x1": 286.4,
"r_y1": 508.1,
"r_x2": 286.4,
"r_y2": 499.2,
"r_x3": 50.1,
"r_y3": 499.2,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 520.0,
"r_x1": 286.4,
"r_y1": 520.0,
"r_x2": 286.4,
"r_y2": 511.1,
"r_x3": 50.1,
"r_y3": 511.1,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 532.0,
"r_x1": 286.4,
"r_y1": 532.0,
"r_x2": 286.4,
"r_y2": 523.1,
"r_x3": 50.1,
"r_y3": 523.1,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.9,
"r_x1": 286.4,
"r_y1": 543.9,
"r_x2": 286.4,
"r_y2": 535.0,
"r_x3": 50.1,
"r_y3": 535.0,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.9,
"r_x1": 286.4,
"r_y1": 555.9,
"r_x2": 286.4,
"r_y2": 547.0,
"r_x3": 50.1,
"r_y3": 547.0,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.8,
"r_x1": 286.4,
"r_y1": 567.8,
"r_x2": 286.4,
"r_y2": 558.9,
"r_x3": 50.1,
"r_y3": 558.9,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.8,
"r_x1": 286.4,
"r_y1": 579.8,
"r_x2": 286.4,
"r_y2": 570.9,
"r_x3": 50.1,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.8,
"r_x1": 286.4,
"r_y1": 591.8,
"r_x2": 286.4,
"r_y2": 582.9,
"r_x3": 50.1,
"r_y3": 582.9,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.7,
"r_x1": 286.4,
"r_y1": 603.7,
"r_x2": 286.4,
"r_y2": 594.8,
"r_x3": 50.1,
"r_y3": 594.8,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.7,
"r_x1": 286.4,
"r_y1": 615.7,
"r_x2": 286.4,
"r_y2": 606.8,
"r_x3": 50.1,
"r_y3": 606.8,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.6,
"r_x1": 209.8,
"r_y1": 627.6,
"r_x2": 209.8,
"r_y2": 618.7,
"r_x3": 50.1,
"r_y3": 618.7,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 632.5,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 62.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 310.7,
"t": 73.2,
"r": 543.0,
"b": 155.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 9,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 167.7,
"r": 545.1,
"b": 224.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 176.6,
"r_x1": 344.6,
"r_y1": 176.6,
"r_x2": 344.6,
"r_y2": 167.7,
"r_x3": 308.9,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.1,
"r_y0": 176.6,
"r_x1": 380.5,
"r_y1": 176.6,
"r_x2": 380.5,
"r_y2": 167.7,
"r_x3": 361.1,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.6,
"r_y0": 176.3,
"r_x1": 468.7,
"r_y1": 176.3,
"r_x2": 468.7,
"r_y2": 167.8,
"r_x3": 386.6,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.6,
"r_x1": 489.2,
"r_y1": 176.6,
"r_x2": 489.2,
"r_y2": 167.7,
"r_x3": 474.8,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.3,
"r_x1": 545.1,
"r_y1": 176.3,
"r_x2": 545.1,
"r_y2": 167.8,
"r_x3": 495.3,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 188.3,
"r_x1": 341.2,
"r_y1": 188.3,
"r_x2": 341.2,
"r_y2": 179.7,
"r_x3": 308.9,
"r_y3": 179.7,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.5,
"r_y0": 188.5,
"r_x1": 545.1,
"r_y1": 188.5,
"r_x2": 545.1,
"r_y2": 179.6,
"r_x3": 343.5,
"r_y3": 179.6,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 200.5,
"r_x1": 545.1,
"r_y1": 200.5,
"r_x2": 545.1,
"r_y2": 191.6,
"r_x3": 308.9,
"r_y3": 191.6,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 212.4,
"r_x1": 545.1,
"r_y1": 212.4,
"r_x2": 545.1,
"r_y2": 203.5,
"r_x3": 308.9,
"r_y3": 203.5,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 224.4,
"r_x1": 523.9,
"r_y1": 224.4,
"r_x2": 523.9,
"r_y2": 215.5,
"r_x3": 308.9,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 308.9,
"t": 249.6,
"r": 545.1,
"b": 294.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.5,
"r_x1": 545.1,
"r_y1": 258.5,
"r_x2": 545.1,
"r_y2": 249.6,
"r_x3": 308.9,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.5,
"r_x1": 545.1,
"r_y1": 270.5,
"r_x2": 545.1,
"r_y2": 261.6,
"r_x3": 308.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.4,
"r_x1": 545.1,
"r_y1": 282.4,
"r_x2": 545.1,
"r_y2": 273.5,
"r_x3": 308.9,
"r_y3": 273.5,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.4,
"r_x1": 436.8,
"r_y1": 294.4,
"r_x2": 436.8,
"r_y2": 285.5,
"r_x3": 308.9,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "text",
"bbox": {
"l": 320.8,
"t": 297.8,
"r": 542.7,
"b": 306.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 306.7,
"r_x1": 542.7,
"r_y1": 306.7,
"r_x2": 542.7,
"r_y2": 297.8,
"r_x3": 320.8,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 321.2,
"r": 444.9,
"b": 331.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 331.9,
"r_x1": 316.3,
"r_y1": 331.9,
"r_x2": 316.3,
"r_y2": 321.2,
"r_x3": 308.9,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.2,
"r_y0": 331.9,
"r_x1": 444.9,
"r_y1": 331.9,
"r_x2": 444.9,
"r_y2": 321.2,
"r_x3": 326.2,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 341.9,
"r": 545.1,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 350.8,
"r_x1": 545.1,
"r_y1": 350.8,
"r_x2": 545.1,
"r_y2": 341.9,
"r_x3": 320.8,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 362.8,
"r_x1": 545.1,
"r_y1": 362.8,
"r_x2": 545.1,
"r_y2": 353.9,
"r_x3": 308.9,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 374.8,
"r_x1": 545.1,
"r_y1": 374.8,
"r_x2": 545.1,
"r_y2": 365.8,
"r_x3": 308.9,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 386.7,
"r_x1": 545.1,
"r_y1": 386.7,
"r_x2": 545.1,
"r_y2": 377.8,
"r_x3": 308.9,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 398.7,
"r_x1": 545.1,
"r_y1": 398.7,
"r_x2": 545.1,
"r_y2": 389.8,
"r_x3": 308.9,
"r_y3": 389.8,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 410.6,
"r_x1": 545.1,
"r_y1": 410.6,
"r_x2": 545.1,
"r_y2": 401.7,
"r_x3": 308.9,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 422.6,
"r_x1": 545.1,
"r_y1": 422.6,
"r_x2": 545.1,
"r_y2": 413.7,
"r_x3": 308.9,
"r_y3": 413.7,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 434.5,
"r_x1": 545.1,
"r_y1": 434.5,
"r_x2": 545.1,
"r_y2": 425.6,
"r_x3": 308.9,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 446.5,
"r_x1": 437.9,
"r_y1": 446.5,
"r_x2": 437.9,
"r_y2": 437.6,
"r_x3": 308.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 457.7,
"r": 420.2,
"b": 467.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 467.5,
"r_x1": 323.1,
"r_y1": 467.5,
"r_x2": 323.1,
"r_y2": 457.7,
"r_x3": 308.9,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.7,
"r_y0": 467.5,
"r_x1": 420.2,
"r_y1": 467.5,
"r_x2": 420.2,
"r_y2": 457.7,
"r_x3": 332.7,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 476.8,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 485.7,
"r_x1": 545.1,
"r_y1": 485.7,
"r_x2": 545.1,
"r_y2": 476.8,
"r_x3": 320.8,
"r_y3": 476.8,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.6,
"r_x1": 509.0,
"r_y1": 497.6,
"r_x2": 509.0,
"r_y2": 488.7,
"r_x3": 308.9,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.6,
"r_y0": 497.6,
"r_x1": 523.1,
"r_y1": 497.6,
"r_x2": 523.1,
"r_y2": 488.7,
"r_x3": 515.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 497.6,
"r_x1": 545.1,
"r_y1": 497.6,
"r_x2": 545.1,
"r_y2": 488.7,
"r_x3": 529.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.4,
"r_x1": 406.3,
"r_y1": 509.4,
"r_x2": 406.3,
"r_y2": 500.8,
"r_x3": 308.9,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.9,
"r_y0": 509.6,
"r_x1": 545.1,
"r_y1": 509.6,
"r_x2": 545.1,
"r_y2": 500.7,
"r_x3": 408.9,
"r_y3": 500.7,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.5,
"r_x1": 409.4,
"r_y1": 521.5,
"r_x2": 409.4,
"r_y2": 512.6,
"r_x3": 308.9,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.7,
"r_y0": 521.5,
"r_x1": 545.1,
"r_y1": 521.5,
"r_x2": 545.1,
"r_y2": 512.6,
"r_x3": 416.7,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.5,
"r_x1": 436.2,
"r_y1": 533.5,
"r_x2": 436.2,
"r_y2": 524.6,
"r_x3": 308.9,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 533.3,
"r_x1": 513.9,
"r_y1": 533.3,
"r_x2": 513.9,
"r_y2": 524.7,
"r_x3": 439.5,
"r_y3": 524.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.4,
"r_y0": 533.5,
"r_x1": 545.1,
"r_y1": 533.5,
"r_x2": 545.1,
"r_y2": 524.6,
"r_x3": 517.4,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.4,
"r_x1": 545.1,
"r_y1": 545.4,
"r_x2": 545.1,
"r_y2": 536.5,
"r_x3": 308.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.4,
"r_x1": 358.5,
"r_y1": 557.4,
"r_x2": 358.5,
"r_y2": 548.5,
"r_x3": 308.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.2,
"r_y0": 557.4,
"r_x1": 545.1,
"r_y1": 557.4,
"r_x2": 545.1,
"r_y2": 548.5,
"r_x3": 365.2,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.4,
"r_x1": 352.4,
"r_y1": 569.4,
"r_x2": 352.4,
"r_y2": 560.5,
"r_x3": 308.9,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.4,
"r_y0": 569.1,
"r_x1": 360.2,
"r_y1": 569.1,
"r_x2": 360.2,
"r_y2": 560.3,
"r_x3": 352.4,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 569.4,
"r_x1": 367.9,
"r_y1": 569.4,
"r_x2": 367.9,
"r_y2": 560.5,
"r_x3": 360.2,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.9,
"r_y0": 569.1,
"r_x1": 375.7,
"r_y1": 569.1,
"r_x2": 375.7,
"r_y2": 560.3,
"r_x3": 367.9,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.7,
"r_y0": 569.4,
"r_x1": 545.1,
"r_y1": 569.4,
"r_x2": 545.1,
"r_y2": 560.5,
"r_x3": 375.7,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.3,
"r_x1": 545.1,
"r_y1": 581.3,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 308.9,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.3,
"r_x1": 483.1,
"r_y1": 593.3,
"r_x2": 483.1,
"r_y2": 584.4,
"r_x3": 308.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 593.0,
"r_x1": 490.9,
"r_y1": 593.0,
"r_x2": 490.9,
"r_y2": 584.2,
"r_x3": 483.1,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.9,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 490.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.2,
"r_x1": 545.1,
"r_y1": 605.2,
"r_x2": 545.1,
"r_y2": 596.3,
"r_x3": 308.9,
"r_y3": 596.3,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 329.6,
"r_y1": 617.2,
"r_x2": 329.6,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.6,
"r_y0": 617.0,
"r_x1": 337.4,
"r_y1": 617.0,
"r_x2": 337.4,
"r_y2": 608.1,
"r_x3": 329.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.4,
"r_y0": 617.2,
"r_x1": 468.6,
"r_y1": 617.2,
"r_x2": 468.6,
"r_y2": 608.3,
"r_x3": 337.4,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 617.0,
"r_x1": 476.3,
"r_y1": 617.0,
"r_x2": 476.3,
"r_y2": 608.1,
"r_x3": 468.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.3,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 476.3,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.1,
"r_x1": 545.1,
"r_y1": 629.1,
"r_x2": 545.1,
"r_y2": 620.2,
"r_x3": 308.9,
"r_y3": 620.2,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.0,
"r_x1": 545.1,
"r_y1": 653.0,
"r_x2": 545.1,
"r_y2": 644.1,
"r_x3": 308.9,
"r_y3": 644.1,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 449.4,
"r_y1": 665.0,
"r_x2": 449.4,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.2,
"r_x1": 431.9,
"r_y1": 677.2,
"r_x2": 431.9,
"r_y2": 668.3,
"r_x3": 320.8,
"r_y3": 668.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 439.5,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"8": {
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.7,
"t": 73.2,
"r": 543.0,
"b": 155.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 10,
"page_no": 3,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 212.3,
"r_y1": 96.1,
"r_x2": 212.3,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."
},
{
"label": "text",
"id": 1,
"page_no": 3,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 101.0,
"r": 286.4,
"b": 313.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 109.9,
"r_x1": 286.4,
"r_y1": 109.9,
"r_x2": 286.4,
"r_y2": 101.0,
"r_x3": 62.1,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 121.8,
"r_x1": 286.4,
"r_y1": 121.8,
"r_x2": 286.4,
"r_y2": 112.9,
"r_x3": 50.1,
"r_y3": 112.9,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 133.8,
"r_x1": 286.4,
"r_y1": 133.8,
"r_x2": 286.4,
"r_y2": 124.9,
"r_x3": 50.1,
"r_y3": 124.9,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 145.7,
"r_x1": 286.4,
"r_y1": 145.7,
"r_x2": 286.4,
"r_y2": 136.8,
"r_x3": 50.1,
"r_y3": 136.8,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 157.7,
"r_x1": 286.4,
"r_y1": 157.7,
"r_x2": 286.4,
"r_y2": 148.8,
"r_x3": 50.1,
"r_y3": 148.8,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 169.6,
"r_x1": 286.4,
"r_y1": 169.6,
"r_x2": 286.4,
"r_y2": 160.7,
"r_x3": 50.1,
"r_y3": 160.7,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 181.6,
"r_x1": 286.4,
"r_y1": 181.6,
"r_x2": 286.4,
"r_y2": 172.7,
"r_x3": 50.1,
"r_y3": 172.7,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 193.6,
"r_x1": 286.4,
"r_y1": 193.6,
"r_x2": 286.4,
"r_y2": 184.6,
"r_x3": 50.1,
"r_y3": 184.6,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 205.5,
"r_x1": 286.4,
"r_y1": 205.5,
"r_x2": 286.4,
"r_y2": 196.6,
"r_x3": 50.1,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 217.5,
"r_x1": 286.4,
"r_y1": 217.5,
"r_x2": 286.4,
"r_y2": 208.6,
"r_x3": 50.1,
"r_y3": 208.6,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 229.4,
"r_x1": 286.4,
"r_y1": 229.4,
"r_x2": 286.4,
"r_y2": 220.5,
"r_x3": 50.1,
"r_y3": 220.5,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 241.4,
"r_x1": 286.4,
"r_y1": 241.4,
"r_x2": 286.4,
"r_y2": 232.5,
"r_x3": 50.1,
"r_y3": 232.5,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 253.3,
"r_x1": 286.4,
"r_y1": 253.3,
"r_x2": 286.4,
"r_y2": 244.4,
"r_x3": 50.1,
"r_y3": 244.4,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 265.3,
"r_x1": 286.4,
"r_y1": 265.3,
"r_x2": 286.4,
"r_y2": 256.4,
"r_x3": 50.1,
"r_y3": 256.4,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 277.2,
"r_x1": 286.4,
"r_y1": 277.2,
"r_x2": 286.4,
"r_y2": 268.3,
"r_x3": 50.1,
"r_y3": 268.3,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 289.2,
"r_x1": 68.7,
"r_y1": 289.2,
"r_x2": 68.7,
"r_y2": 280.3,
"r_x3": 50.1,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.6,
"r_y0": 289.2,
"r_x1": 286.4,
"r_y1": 289.2,
"r_x2": 286.4,
"r_y2": 280.3,
"r_x3": 75.6,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 301.2,
"r_x1": 286.4,
"r_y1": 301.2,
"r_x2": 286.4,
"r_y2": 292.2,
"r_x3": 50.1,
"r_y3": 292.2,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 313.1,
"r_x1": 75.7,
"r_y1": 313.1,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.1,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 3,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 318.0,
"r": 286.4,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.0,
"r_x3": 62.1,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 338.9,
"r_x1": 286.4,
"r_y1": 338.9,
"r_x2": 286.4,
"r_y2": 330.0,
"r_x3": 50.1,
"r_y3": 330.0,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 350.8,
"r_x1": 286.4,
"r_y1": 350.8,
"r_x2": 286.4,
"r_y2": 341.9,
"r_x3": 50.1,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 362.8,
"r_x1": 286.4,
"r_y1": 362.8,
"r_x2": 286.4,
"r_y2": 353.9,
"r_x3": 50.1,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 374.7,
"r_x1": 286.4,
"r_y1": 374.7,
"r_x2": 286.4,
"r_y2": 365.8,
"r_x3": 50.1,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 386.7,
"r_x1": 141.6,
"r_y1": 386.7,
"r_x2": 141.6,
"r_y2": 377.8,
"r_x3": 50.1,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.7,
"r_x1": 286.4,
"r_y1": 386.7,
"r_x2": 286.4,
"r_y2": 377.8,
"r_x3": 148.7,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 398.6,
"r_x1": 286.4,
"r_y1": 398.6,
"r_x2": 286.4,
"r_y2": 389.7,
"r_x3": 50.1,
"r_y3": 389.7,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 410.6,
"r_x1": 286.4,
"r_y1": 410.6,
"r_x2": 286.4,
"r_y2": 401.7,
"r_x3": 50.1,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 422.5,
"r_x1": 286.4,
"r_y1": 422.5,
"r_x2": 286.4,
"r_y2": 413.6,
"r_x3": 50.1,
"r_y3": 413.6,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.6,
"r_x3": 50.1,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."
},
{
"label": "text",
"id": 3,
"page_no": 3,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 439.4,
"r": 286.4,
"b": 627.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 448.3,
"r_x1": 286.4,
"r_y1": 448.3,
"r_x2": 286.4,
"r_y2": 439.4,
"r_x3": 62.1,
"r_y3": 439.4,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.3,
"r_x1": 172.1,
"r_y1": 460.3,
"r_x2": 172.1,
"r_y2": 451.3,
"r_x3": 50.1,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.1,
"r_y0": 460.0,
"r_x1": 224.7,
"r_y1": 460.0,
"r_x2": 224.7,
"r_y2": 451.4,
"r_x3": 174.1,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.7,
"r_y0": 460.3,
"r_x1": 286.4,
"r_y1": 460.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 224.7,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.2,
"r_x1": 286.4,
"r_y1": 472.2,
"r_x2": 286.4,
"r_y2": 463.3,
"r_x3": 50.1,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.2,
"r_x1": 286.4,
"r_y1": 484.2,
"r_x2": 286.4,
"r_y2": 475.3,
"r_x3": 50.1,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.1,
"r_x1": 286.4,
"r_y1": 496.1,
"r_x2": 286.4,
"r_y2": 487.2,
"r_x3": 50.1,
"r_y3": 487.2,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 508.1,
"r_x1": 286.4,
"r_y1": 508.1,
"r_x2": 286.4,
"r_y2": 499.2,
"r_x3": 50.1,
"r_y3": 499.2,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 520.0,
"r_x1": 286.4,
"r_y1": 520.0,
"r_x2": 286.4,
"r_y2": 511.1,
"r_x3": 50.1,
"r_y3": 511.1,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 532.0,
"r_x1": 286.4,
"r_y1": 532.0,
"r_x2": 286.4,
"r_y2": 523.1,
"r_x3": 50.1,
"r_y3": 523.1,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.9,
"r_x1": 286.4,
"r_y1": 543.9,
"r_x2": 286.4,
"r_y2": 535.0,
"r_x3": 50.1,
"r_y3": 535.0,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.9,
"r_x1": 286.4,
"r_y1": 555.9,
"r_x2": 286.4,
"r_y2": 547.0,
"r_x3": 50.1,
"r_y3": 547.0,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.8,
"r_x1": 286.4,
"r_y1": 567.8,
"r_x2": 286.4,
"r_y2": 558.9,
"r_x3": 50.1,
"r_y3": 558.9,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.8,
"r_x1": 286.4,
"r_y1": 579.8,
"r_x2": 286.4,
"r_y2": 570.9,
"r_x3": 50.1,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.8,
"r_x1": 286.4,
"r_y1": 591.8,
"r_x2": 286.4,
"r_y2": 582.9,
"r_x3": 50.1,
"r_y3": 582.9,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.7,
"r_x1": 286.4,
"r_y1": 603.7,
"r_x2": 286.4,
"r_y2": 594.8,
"r_x3": 50.1,
"r_y3": 594.8,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.7,
"r_x1": 286.4,
"r_y1": 615.7,
"r_x2": 286.4,
"r_y2": 606.8,
"r_x3": 50.1,
"r_y3": 606.8,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.6,
"r_x1": 209.8,
"r_y1": 627.6,
"r_x2": 209.8,
"r_y2": 618.7,
"r_x3": 50.1,
"r_y3": 618.7,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."
},
{
"label": "text",
"id": 5,
"page_no": 3,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 632.5,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 62.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"
},
{
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.7,
"t": 73.2,
"r": 543.0,
"b": 155.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 9,
"page_no": 3,
"cluster": {
"id": 9,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 167.7,
"r": 545.1,
"b": 224.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 176.6,
"r_x1": 344.6,
"r_y1": 176.6,
"r_x2": 344.6,
"r_y2": 167.7,
"r_x3": 308.9,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.1,
"r_y0": 176.6,
"r_x1": 380.5,
"r_y1": 176.6,
"r_x2": 380.5,
"r_y2": 167.7,
"r_x3": 361.1,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.6,
"r_y0": 176.3,
"r_x1": 468.7,
"r_y1": 176.3,
"r_x2": 468.7,
"r_y2": 167.8,
"r_x3": 386.6,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.6,
"r_x1": 489.2,
"r_y1": 176.6,
"r_x2": 489.2,
"r_y2": 167.7,
"r_x3": 474.8,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.3,
"r_x1": 545.1,
"r_y1": 176.3,
"r_x2": 545.1,
"r_y2": 167.8,
"r_x3": 495.3,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 188.3,
"r_x1": 341.2,
"r_y1": 188.3,
"r_x2": 341.2,
"r_y2": 179.7,
"r_x3": 308.9,
"r_y3": 179.7,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.5,
"r_y0": 188.5,
"r_x1": 545.1,
"r_y1": 188.5,
"r_x2": 545.1,
"r_y2": 179.6,
"r_x3": 343.5,
"r_y3": 179.6,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 200.5,
"r_x1": 545.1,
"r_y1": 200.5,
"r_x2": 545.1,
"r_y2": 191.6,
"r_x3": 308.9,
"r_y3": 191.6,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 212.4,
"r_x1": 545.1,
"r_y1": 212.4,
"r_x2": 545.1,
"r_y2": 203.5,
"r_x3": 308.9,
"r_y3": 203.5,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 224.4,
"r_x1": 523.9,
"r_y1": 224.4,
"r_x2": 523.9,
"r_y2": 215.5,
"r_x3": 308.9,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."
},
{
"label": "text",
"id": 6,
"page_no": 3,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 308.9,
"t": 249.6,
"r": 545.1,
"b": 294.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.5,
"r_x1": 545.1,
"r_y1": 258.5,
"r_x2": 545.1,
"r_y2": 249.6,
"r_x3": 308.9,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.5,
"r_x1": 545.1,
"r_y1": 270.5,
"r_x2": 545.1,
"r_y2": 261.6,
"r_x3": 308.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.4,
"r_x1": 545.1,
"r_y1": 282.4,
"r_x2": 545.1,
"r_y2": 273.5,
"r_x3": 308.9,
"r_y3": 273.5,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.4,
"r_x1": 436.8,
"r_y1": 294.4,
"r_x2": 436.8,
"r_y2": 285.5,
"r_x3": 308.9,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."
},
{
"label": "text",
"id": 13,
"page_no": 3,
"cluster": {
"id": 13,
"label": "text",
"bbox": {
"l": 320.8,
"t": 297.8,
"r": 542.7,
"b": 306.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 306.7,
"r_x1": 542.7,
"r_y1": 306.7,
"r_x2": 542.7,
"r_y2": 297.8,
"r_x3": 320.8,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tab. 1 summarizes the various attributes of the datasets."
},
{
"label": "section_header",
"id": 11,
"page_no": 3,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 321.2,
"r": 444.9,
"b": 331.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 331.9,
"r_x1": 316.3,
"r_y1": 331.9,
"r_x2": 316.3,
"r_y2": 321.2,
"r_x3": 308.9,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.2,
"r_y0": 331.9,
"r_x1": 444.9,
"r_y1": 331.9,
"r_x2": 444.9,
"r_y2": 321.2,
"r_x3": 326.2,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. The TableFormer model"
},
{
"label": "text",
"id": 0,
"page_no": 3,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 341.9,
"r": 545.1,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 350.8,
"r_x1": 545.1,
"r_y1": 350.8,
"r_x2": 545.1,
"r_y2": 341.9,
"r_x3": 320.8,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 362.8,
"r_x1": 545.1,
"r_y1": 362.8,
"r_x2": 545.1,
"r_y2": 353.9,
"r_x3": 308.9,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 374.8,
"r_x1": 545.1,
"r_y1": 374.8,
"r_x2": 545.1,
"r_y2": 365.8,
"r_x3": 308.9,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 386.7,
"r_x1": 545.1,
"r_y1": 386.7,
"r_x2": 545.1,
"r_y2": 377.8,
"r_x3": 308.9,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 398.7,
"r_x1": 545.1,
"r_y1": 398.7,
"r_x2": 545.1,
"r_y2": 389.8,
"r_x3": 308.9,
"r_y3": 389.8,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 410.6,
"r_x1": 545.1,
"r_y1": 410.6,
"r_x2": 545.1,
"r_y2": 401.7,
"r_x3": 308.9,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 422.6,
"r_x1": 545.1,
"r_y1": 422.6,
"r_x2": 545.1,
"r_y2": 413.7,
"r_x3": 308.9,
"r_y3": 413.7,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 434.5,
"r_x1": 545.1,
"r_y1": 434.5,
"r_x2": 545.1,
"r_y2": 425.6,
"r_x3": 308.9,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 446.5,
"r_x1": 437.9,
"r_y1": 446.5,
"r_x2": 437.9,
"r_y2": 437.6,
"r_x3": 308.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."
},
{
"label": "section_header",
"id": 12,
"page_no": 3,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 457.7,
"r": 420.2,
"b": 467.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 467.5,
"r_x1": 323.1,
"r_y1": 467.5,
"r_x2": 323.1,
"r_y2": 457.7,
"r_x3": 308.9,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.7,
"r_y0": 467.5,
"r_x1": 420.2,
"r_y1": 467.5,
"r_x2": 420.2,
"r_y2": 457.7,
"r_x3": 332.7,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4.1. Model architecture."
},
{
"label": "text",
"id": 2,
"page_no": 3,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 476.8,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 485.7,
"r_x1": 545.1,
"r_y1": 485.7,
"r_x2": 545.1,
"r_y2": 476.8,
"r_x3": 320.8,
"r_y3": 476.8,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.6,
"r_x1": 509.0,
"r_y1": 497.6,
"r_x2": 509.0,
"r_y2": 488.7,
"r_x3": 308.9,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.6,
"r_y0": 497.6,
"r_x1": 523.1,
"r_y1": 497.6,
"r_x2": 523.1,
"r_y2": 488.7,
"r_x3": 515.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 497.6,
"r_x1": 545.1,
"r_y1": 497.6,
"r_x2": 545.1,
"r_y2": 488.7,
"r_x3": 529.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.4,
"r_x1": 406.3,
"r_y1": 509.4,
"r_x2": 406.3,
"r_y2": 500.8,
"r_x3": 308.9,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.9,
"r_y0": 509.6,
"r_x1": 545.1,
"r_y1": 509.6,
"r_x2": 545.1,
"r_y2": 500.7,
"r_x3": 408.9,
"r_y3": 500.7,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.5,
"r_x1": 409.4,
"r_y1": 521.5,
"r_x2": 409.4,
"r_y2": 512.6,
"r_x3": 308.9,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.7,
"r_y0": 521.5,
"r_x1": 545.1,
"r_y1": 521.5,
"r_x2": 545.1,
"r_y2": 512.6,
"r_x3": 416.7,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.5,
"r_x1": 436.2,
"r_y1": 533.5,
"r_x2": 436.2,
"r_y2": 524.6,
"r_x3": 308.9,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 533.3,
"r_x1": 513.9,
"r_y1": 533.3,
"r_x2": 513.9,
"r_y2": 524.7,
"r_x3": 439.5,
"r_y3": 524.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.4,
"r_y0": 533.5,
"r_x1": 545.1,
"r_y1": 533.5,
"r_x2": 545.1,
"r_y2": 524.6,
"r_x3": 517.4,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.4,
"r_x1": 545.1,
"r_y1": 545.4,
"r_x2": 545.1,
"r_y2": 536.5,
"r_x3": 308.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.4,
"r_x1": 358.5,
"r_y1": 557.4,
"r_x2": 358.5,
"r_y2": 548.5,
"r_x3": 308.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.2,
"r_y0": 557.4,
"r_x1": 545.1,
"r_y1": 557.4,
"r_x2": 545.1,
"r_y2": 548.5,
"r_x3": 365.2,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.4,
"r_x1": 352.4,
"r_y1": 569.4,
"r_x2": 352.4,
"r_y2": 560.5,
"r_x3": 308.9,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.4,
"r_y0": 569.1,
"r_x1": 360.2,
"r_y1": 569.1,
"r_x2": 360.2,
"r_y2": 560.3,
"r_x3": 352.4,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 569.4,
"r_x1": 367.9,
"r_y1": 569.4,
"r_x2": 367.9,
"r_y2": 560.5,
"r_x3": 360.2,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.9,
"r_y0": 569.1,
"r_x1": 375.7,
"r_y1": 569.1,
"r_x2": 375.7,
"r_y2": 560.3,
"r_x3": 367.9,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.7,
"r_y0": 569.4,
"r_x1": 545.1,
"r_y1": 569.4,
"r_x2": 545.1,
"r_y2": 560.5,
"r_x3": 375.7,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.3,
"r_x1": 545.1,
"r_y1": 581.3,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 308.9,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.3,
"r_x1": 483.1,
"r_y1": 593.3,
"r_x2": 483.1,
"r_y2": 584.4,
"r_x3": 308.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 593.0,
"r_x1": 490.9,
"r_y1": 593.0,
"r_x2": 490.9,
"r_y2": 584.2,
"r_x3": 483.1,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.9,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 490.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.2,
"r_x1": 545.1,
"r_y1": 605.2,
"r_x2": 545.1,
"r_y2": 596.3,
"r_x3": 308.9,
"r_y3": 596.3,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 329.6,
"r_y1": 617.2,
"r_x2": 329.6,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.6,
"r_y0": 617.0,
"r_x1": 337.4,
"r_y1": 617.0,
"r_x2": 337.4,
"r_y2": 608.1,
"r_x3": 329.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.4,
"r_y0": 617.2,
"r_x1": 468.6,
"r_y1": 617.2,
"r_x2": 468.6,
"r_y2": 608.3,
"r_x3": 337.4,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 617.0,
"r_x1": 476.3,
"r_y1": 617.0,
"r_x2": 476.3,
"r_y2": 608.1,
"r_x3": 468.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.3,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 476.3,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.1,
"r_x1": 545.1,
"r_y1": 629.1,
"r_x2": 545.1,
"r_y2": 620.2,
"r_x3": 308.9,
"r_y3": 620.2,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.0,
"r_x1": 545.1,
"r_y1": 653.0,
"r_x2": 545.1,
"r_y2": 644.1,
"r_x3": 308.9,
"r_y3": 644.1,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 449.4,
"r_y1": 665.0,
"r_x2": 449.4,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."
},
{
"label": "text",
"id": 7,
"page_no": 3,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.2,
"r_x1": 431.9,
"r_y1": 677.2,
"r_x2": 431.9,
"r_y2": 668.3,
"r_x3": 320.8,
"r_y3": 668.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 439.5,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"
},
{
"label": "page_footer",
"id": 14,
"page_no": 3,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4"
}
],
"body": [
{
"label": "text",
"id": 10,
"page_no": 3,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 96.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "amount of such tables, and kept only those ones ranging",
"orig": "amount of such tables, and kept only those ones ranging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 212.3,
"r_y1": 96.1,
"r_x2": 212.3,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "between 1*1 and 20*10 (rows/columns).",
"orig": "between 1*1 and 20*10 (rows/columns).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."
},
{
"label": "text",
"id": 1,
"page_no": 3,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 101.0,
"r": 286.4,
"b": 313.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 109.9,
"r_x1": 286.4,
"r_y1": 109.9,
"r_x2": 286.4,
"r_y2": 101.0,
"r_x3": 62.1,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "The availability of the bounding boxes for all table cells",
"orig": "The availability of the bounding boxes for all table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 121.8,
"r_x1": 286.4,
"r_y1": 121.8,
"r_x2": 286.4,
"r_y2": 112.9,
"r_x3": 50.1,
"r_y3": 112.9,
"coord_origin": "TOPLEFT"
},
"text": "is essential to train our models. In order to distinguish be-",
"orig": "is essential to train our models. In order to distinguish be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 133.8,
"r_x1": 286.4,
"r_y1": 133.8,
"r_x2": 286.4,
"r_y2": 124.9,
"r_x3": 50.1,
"r_y3": 124.9,
"coord_origin": "TOPLEFT"
},
"text": "tween empty and non-empty bounding boxes, we have in-",
"orig": "tween empty and non-empty bounding boxes, we have in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 145.7,
"r_x1": 286.4,
"r_y1": 145.7,
"r_x2": 286.4,
"r_y2": 136.8,
"r_x3": 50.1,
"r_y3": 136.8,
"coord_origin": "TOPLEFT"
},
"text": "troduced a binary class in the annotation. Unfortunately, the",
"orig": "troduced a binary class in the annotation. Unfortunately, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 157.7,
"r_x1": 286.4,
"r_y1": 157.7,
"r_x2": 286.4,
"r_y2": 148.8,
"r_x3": 50.1,
"r_y3": 148.8,
"coord_origin": "TOPLEFT"
},
"text": "original datasets either omit the bounding boxes for whole",
"orig": "original datasets either omit the bounding boxes for whole",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 169.6,
"r_x1": 286.4,
"r_y1": 169.6,
"r_x2": 286.4,
"r_y2": 160.7,
"r_x3": 50.1,
"r_y3": 160.7,
"coord_origin": "TOPLEFT"
},
"text": "tables (e.g. TableBank) or they narrow their scope only to",
"orig": "tables (e.g. TableBank) or they narrow their scope only to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 181.6,
"r_x1": 286.4,
"r_y1": 181.6,
"r_x2": 286.4,
"r_y2": 172.7,
"r_x3": 50.1,
"r_y3": 172.7,
"coord_origin": "TOPLEFT"
},
"text": "non-empty cells. Therefore, it was imperative to introduce",
"orig": "non-empty cells. Therefore, it was imperative to introduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 193.6,
"r_x1": 286.4,
"r_y1": 193.6,
"r_x2": 286.4,
"r_y2": 184.6,
"r_x3": 50.1,
"r_y3": 184.6,
"coord_origin": "TOPLEFT"
},
"text": "a data pre-processing procedure that generates the missing",
"orig": "a data pre-processing procedure that generates the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 205.5,
"r_x1": 286.4,
"r_y1": 205.5,
"r_x2": 286.4,
"r_y2": 196.6,
"r_x3": 50.1,
"r_y3": 196.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes out of the annotation information. This pro-",
"orig": "bounding boxes out of the annotation information. This pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 217.5,
"r_x1": 286.4,
"r_y1": 217.5,
"r_x2": 286.4,
"r_y2": 208.6,
"r_x3": 50.1,
"r_y3": 208.6,
"coord_origin": "TOPLEFT"
},
"text": "cedure first parses the provided table structure and calcu-",
"orig": "cedure first parses the provided table structure and calcu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 229.4,
"r_x1": 286.4,
"r_y1": 229.4,
"r_x2": 286.4,
"r_y2": 220.5,
"r_x3": 50.1,
"r_y3": 220.5,
"coord_origin": "TOPLEFT"
},
"text": "lates the dimensions of the most fine-grained grid that cov-",
"orig": "lates the dimensions of the most fine-grained grid that cov-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 241.4,
"r_x1": 286.4,
"r_y1": 241.4,
"r_x2": 286.4,
"r_y2": 232.5,
"r_x3": 50.1,
"r_y3": 232.5,
"coord_origin": "TOPLEFT"
},
"text": "ers the table structure. Notice that each table cell may oc-",
"orig": "ers the table structure. Notice that each table cell may oc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 253.3,
"r_x1": 286.4,
"r_y1": 253.3,
"r_x2": 286.4,
"r_y2": 244.4,
"r_x3": 50.1,
"r_y3": 244.4,
"coord_origin": "TOPLEFT"
},
"text": "cupy multiple grid squares due to row or column spans. In",
"orig": "cupy multiple grid squares due to row or column spans. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 265.3,
"r_x1": 286.4,
"r_y1": 265.3,
"r_x2": 286.4,
"r_y2": 256.4,
"r_x3": 50.1,
"r_y3": 256.4,
"coord_origin": "TOPLEFT"
},
"text": "case of PubTabNet we had to compute missing bounding",
"orig": "case of PubTabNet we had to compute missing bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 277.2,
"r_x1": 286.4,
"r_y1": 277.2,
"r_x2": 286.4,
"r_y2": 268.3,
"r_x3": 50.1,
"r_y3": 268.3,
"coord_origin": "TOPLEFT"
},
"text": "boxes for 48% of the simple and 69% of the complex ta-",
"orig": "boxes for 48% of the simple and 69% of the complex ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 289.2,
"r_x1": 68.7,
"r_y1": 289.2,
"r_x2": 68.7,
"r_y2": 280.3,
"r_x3": 50.1,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "bles.",
"orig": "bles.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 75.6,
"r_y0": 289.2,
"r_x1": 286.4,
"r_y1": 289.2,
"r_x2": 286.4,
"r_y2": 280.3,
"r_x3": 75.6,
"r_y3": 280.3,
"coord_origin": "TOPLEFT"
},
"text": "Regarding FinTabNet, 68% of the simple and 98%",
"orig": "Regarding FinTabNet, 68% of the simple and 98%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 301.2,
"r_x1": 286.4,
"r_y1": 301.2,
"r_x2": 286.4,
"r_y2": 292.2,
"r_x3": 50.1,
"r_y3": 292.2,
"coord_origin": "TOPLEFT"
},
"text": "of the complex tables require the generation of bounding",
"orig": "of the complex tables require the generation of bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 313.1,
"r_x1": 75.7,
"r_y1": 313.1,
"r_x2": 75.7,
"r_y2": 304.2,
"r_x3": 50.1,
"r_y3": 304.2,
"coord_origin": "TOPLEFT"
},
"text": "boxes.",
"orig": "boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 3,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 318.0,
"r": 286.4,
"b": 434.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.0,
"r_x3": 62.1,
"r_y3": 318.0,
"coord_origin": "TOPLEFT"
},
"text": "As it is illustrated in Fig. 2, the table distributions from",
"orig": "As it is illustrated in Fig. 2, the table distributions from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 338.9,
"r_x1": 286.4,
"r_y1": 338.9,
"r_x2": 286.4,
"r_y2": 330.0,
"r_x3": 50.1,
"r_y3": 330.0,
"coord_origin": "TOPLEFT"
},
"text": "all datasets are skewed towards simpler structures with",
"orig": "all datasets are skewed towards simpler structures with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 350.8,
"r_x1": 286.4,
"r_y1": 350.8,
"r_x2": 286.4,
"r_y2": 341.9,
"r_x3": 50.1,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "fewer number of rows/columns. Additionally, there is very",
"orig": "fewer number of rows/columns. Additionally, there is very",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 362.8,
"r_x1": 286.4,
"r_y1": 362.8,
"r_x2": 286.4,
"r_y2": 353.9,
"r_x3": 50.1,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "limited variance in the table styles, which in case of Pub-",
"orig": "limited variance in the table styles, which in case of Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 374.7,
"r_x1": 286.4,
"r_y1": 374.7,
"r_x2": 286.4,
"r_y2": 365.8,
"r_x3": 50.1,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "TabNet and FinTabNet means one styling format for the",
"orig": "TabNet and FinTabNet means one styling format for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 386.7,
"r_x1": 141.6,
"r_y1": 386.7,
"r_x2": 141.6,
"r_y2": 377.8,
"r_x3": 50.1,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "majority of the tables.",
"orig": "majority of the tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 148.7,
"r_y0": 386.7,
"r_x1": 286.4,
"r_y1": 386.7,
"r_x2": 286.4,
"r_y2": 377.8,
"r_x3": 148.7,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "Similar limitations appear also in",
"orig": "Similar limitations appear also in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 398.6,
"r_x1": 286.4,
"r_y1": 398.6,
"r_x2": 286.4,
"r_y2": 389.7,
"r_x3": 50.1,
"r_y3": 389.7,
"coord_origin": "TOPLEFT"
},
"text": "the type of table content, which in some cases (e.g. FinTab-",
"orig": "the type of table content, which in some cases (e.g. FinTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 410.6,
"r_x1": 286.4,
"r_y1": 410.6,
"r_x2": 286.4,
"r_y2": 401.7,
"r_x3": 50.1,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "Net) is restricted to a certain domain. Ultimately, the lack",
"orig": "Net) is restricted to a certain domain. Ultimately, the lack",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 422.5,
"r_x1": 286.4,
"r_y1": 422.5,
"r_x2": 286.4,
"r_y2": 413.6,
"r_x3": 50.1,
"r_y3": 413.6,
"coord_origin": "TOPLEFT"
},
"text": "of diversity in the training dataset damages the ability of the",
"orig": "of diversity in the training dataset damages the ability of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 434.5,
"r_x1": 216.4,
"r_y1": 434.5,
"r_x2": 216.4,
"r_y2": 425.6,
"r_x3": 50.1,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "models to generalize well on unseen data.",
"orig": "models to generalize well on unseen data.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."
},
{
"label": "text",
"id": 3,
"page_no": 3,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 439.4,
"r": 286.4,
"b": 627.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 448.3,
"r_x1": 286.4,
"r_y1": 448.3,
"r_x2": 286.4,
"r_y2": 439.4,
"r_x3": 62.1,
"r_y3": 439.4,
"coord_origin": "TOPLEFT"
},
"text": "Motivated by those observations we aimed at generating",
"orig": "Motivated by those observations we aimed at generating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.3,
"r_x1": 172.1,
"r_y1": 460.3,
"r_x2": 172.1,
"r_y2": 451.3,
"r_x3": 50.1,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "a synthetic table dataset named",
"orig": "a synthetic table dataset named",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.1,
"r_y0": 460.0,
"r_x1": 224.7,
"r_y1": 460.0,
"r_x2": 224.7,
"r_y2": 451.4,
"r_x3": 174.1,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.7,
"r_y0": 460.3,
"r_x1": 286.4,
"r_y1": 460.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 224.7,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": ". This approach",
"orig": ". This approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.2,
"r_x1": 286.4,
"r_y1": 472.2,
"r_x2": 286.4,
"r_y2": 463.3,
"r_x3": 50.1,
"r_y3": 463.3,
"coord_origin": "TOPLEFT"
},
"text": "offers control over: 1) the size of the dataset, 2) the table",
"orig": "offers control over: 1) the size of the dataset, 2) the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.2,
"r_x1": 286.4,
"r_y1": 484.2,
"r_x2": 286.4,
"r_y2": 475.3,
"r_x3": 50.1,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "structure, 3) the table style and 4) the type of content. The",
"orig": "structure, 3) the table style and 4) the type of content. The",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.1,
"r_x1": 286.4,
"r_y1": 496.1,
"r_x2": 286.4,
"r_y2": 487.2,
"r_x3": 50.1,
"r_y3": 487.2,
"coord_origin": "TOPLEFT"
},
"text": "complexity of the table structure is described by the size of",
"orig": "complexity of the table structure is described by the size of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 508.1,
"r_x1": 286.4,
"r_y1": 508.1,
"r_x2": 286.4,
"r_y2": 499.2,
"r_x3": 50.1,
"r_y3": 499.2,
"coord_origin": "TOPLEFT"
},
"text": "the table header and the table body, as well as the percentage",
"orig": "the table header and the table body, as well as the percentage",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 520.0,
"r_x1": 286.4,
"r_y1": 520.0,
"r_x2": 286.4,
"r_y2": 511.1,
"r_x3": 50.1,
"r_y3": 511.1,
"coord_origin": "TOPLEFT"
},
"text": "of the table cells covered by row spans and column spans.",
"orig": "of the table cells covered by row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 532.0,
"r_x1": 286.4,
"r_y1": 532.0,
"r_x2": 286.4,
"r_y2": 523.1,
"r_x3": 50.1,
"r_y3": 523.1,
"coord_origin": "TOPLEFT"
},
"text": "A set of carefully designed styling templates provides the",
"orig": "A set of carefully designed styling templates provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.9,
"r_x1": 286.4,
"r_y1": 543.9,
"r_x2": 286.4,
"r_y2": 535.0,
"r_x3": 50.1,
"r_y3": 535.0,
"coord_origin": "TOPLEFT"
},
"text": "basis to build a wide range of table appearances. Lastly, the",
"orig": "basis to build a wide range of table appearances. Lastly, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.9,
"r_x1": 286.4,
"r_y1": 555.9,
"r_x2": 286.4,
"r_y2": 547.0,
"r_x3": 50.1,
"r_y3": 547.0,
"coord_origin": "TOPLEFT"
},
"text": "table content is generated out of a curated collection of text",
"orig": "table content is generated out of a curated collection of text",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.8,
"r_x1": 286.4,
"r_y1": 567.8,
"r_x2": 286.4,
"r_y2": 558.9,
"r_x3": 50.1,
"r_y3": 558.9,
"coord_origin": "TOPLEFT"
},
"text": "corpora. By controlling the size and scope of the synthetic",
"orig": "corpora. By controlling the size and scope of the synthetic",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.8,
"r_x1": 286.4,
"r_y1": 579.8,
"r_x2": 286.4,
"r_y2": 570.9,
"r_x3": 50.1,
"r_y3": 570.9,
"coord_origin": "TOPLEFT"
},
"text": "datasets we are able to train and evaluate our models in a",
"orig": "datasets we are able to train and evaluate our models in a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.8,
"r_x1": 286.4,
"r_y1": 591.8,
"r_x2": 286.4,
"r_y2": 582.9,
"r_x3": 50.1,
"r_y3": 582.9,
"coord_origin": "TOPLEFT"
},
"text": "variety of different conditions. For example, we can first",
"orig": "variety of different conditions. For example, we can first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.7,
"r_x1": 286.4,
"r_y1": 603.7,
"r_x2": 286.4,
"r_y2": 594.8,
"r_x3": 50.1,
"r_y3": 594.8,
"coord_origin": "TOPLEFT"
},
"text": "generate a highly diverse dataset to train our models and",
"orig": "generate a highly diverse dataset to train our models and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.7,
"r_x1": 286.4,
"r_y1": 615.7,
"r_x2": 286.4,
"r_y2": 606.8,
"r_x3": 50.1,
"r_y3": 606.8,
"coord_origin": "TOPLEFT"
},
"text": "then evaluate their performance on other synthetic datasets",
"orig": "then evaluate their performance on other synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.6,
"r_x1": 209.8,
"r_y1": 627.6,
"r_x2": 209.8,
"r_y2": 618.7,
"r_x3": 50.1,
"r_y3": 618.7,
"coord_origin": "TOPLEFT"
},
"text": "which are focused on a specific domain.",
"orig": "which are focused on a specific domain.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."
},
{
"label": "text",
"id": 5,
"page_no": 3,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 632.5,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 62.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "In this regard, we have prepared four synthetic datasets,",
"orig": "In this regard, we have prepared four synthetic datasets,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "each one containing 150k examples. The corpora to gener-",
"orig": "each one containing 150k examples. The corpora to gener-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "ate the table text consists of the most frequent terms appear-",
"orig": "ate the table text consists of the most frequent terms appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "ing in PubTabNet and FinTabNet together with randomly",
"orig": "ing in PubTabNet and FinTabNet together with randomly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "generated text. The first two synthetic datasets have been",
"orig": "generated text. The first two synthetic datasets have been",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "fine-tuned to mimic the appearance of the original datasets",
"orig": "fine-tuned to mimic the appearance of the original datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "but encompass more complicated table structures. The third",
"orig": "but encompass more complicated table structures. The third",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"
},
{
"label": "table",
"id": 8,
"page_no": 3,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 310.7,
"t": 73.2,
"r": 543.0,
"b": 155.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 17,
"label": "text",
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 412.3,
"r_y0": 82.5,
"r_x1": 430.9,
"r_y1": 82.5,
"r_x2": 430.9,
"r_y2": 73.6,
"r_x3": 412.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Tags",
"orig": "Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "text",
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 442.9,
"r_y0": 82.5,
"r_x1": 464.4,
"r_y1": 82.5,
"r_x2": 464.4,
"r_y2": 73.6,
"r_x3": 442.9,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Bbox",
"orig": "Bbox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.8,
"r_y0": 82.5,
"r_x1": 494.9,
"r_y1": 82.5,
"r_x2": 494.9,
"r_y2": 73.6,
"r_x3": 477.8,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Size",
"orig": "Size",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "text",
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.3,
"r_y0": 82.5,
"r_x1": 536.9,
"r_y1": 82.5,
"r_x2": 536.9,
"r_y2": 73.6,
"r_x3": 508.3,
"r_y3": 73.6,
"coord_origin": "TOPLEFT"
},
"text": "Format",
"orig": "Format",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "text",
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 94.9,
"r_x1": 361.6,
"r_y1": 94.9,
"r_x2": 361.6,
"r_y2": 86.0,
"r_x3": 317.1,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "text",
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 94.9,
"r_x1": 425.4,
"r_y1": 94.9,
"r_x2": 425.4,
"r_y2": 85.7,
"r_x3": 417.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "text",
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 94.9,
"r_x1": 457.4,
"r_y1": 94.9,
"r_x2": 457.4,
"r_y2": 85.7,
"r_x3": 449.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "text",
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 94.9,
"r_x1": 496.3,
"r_y1": 94.9,
"r_x2": 496.3,
"r_y2": 86.0,
"r_x3": 476.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "509k",
"orig": "509k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "text",
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 94.9,
"r_x1": 532.6,
"r_y1": 94.9,
"r_x2": 532.6,
"r_y2": 86.0,
"r_x3": 512.6,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 26,
"label": "text",
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 106.8,
"r_x1": 359.4,
"r_y1": 106.8,
"r_x2": 359.4,
"r_y2": 97.9,
"r_x3": 317.1,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 27,
"label": "text",
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 106.8,
"r_x1": 425.4,
"r_y1": 106.8,
"r_x2": 425.4,
"r_y2": 97.6,
"r_x3": 417.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 106.8,
"r_x1": 457.4,
"r_y1": 106.8,
"r_x2": 457.4,
"r_y2": 97.6,
"r_x3": 449.9,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 106.8,
"r_x1": 496.3,
"r_y1": 106.8,
"r_x2": 496.3,
"r_y2": 97.9,
"r_x3": 476.4,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "112k",
"orig": "112k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.5,
"r_y0": 106.8,
"r_x1": 531.7,
"r_y1": 106.8,
"r_x2": 531.7,
"r_y2": 97.9,
"r_x3": 513.5,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF",
"orig": "PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 118.8,
"r_x1": 360.0,
"r_y1": 118.8,
"r_x2": 360.0,
"r_y2": 109.9,
"r_x3": 317.1,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "TableBank",
"orig": "TableBank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 118.8,
"r_x1": 425.4,
"r_y1": 118.8,
"r_x2": 425.4,
"r_y2": 109.6,
"r_x3": 417.9,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.8,
"r_y0": 118.8,
"r_x1": 456.5,
"r_y1": 118.8,
"r_x2": 456.5,
"r_y2": 109.6,
"r_x3": 450.8,
"r_y3": 109.6,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 118.8,
"r_x1": 496.3,
"r_y1": 118.8,
"r_x2": 496.3,
"r_y2": 109.9,
"r_x3": 476.4,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "145k",
"orig": "145k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.3,
"r_y0": 118.8,
"r_x1": 533.9,
"r_y1": 118.8,
"r_x2": 533.9,
"r_y2": 109.9,
"r_x3": 511.3,
"r_y3": 109.9,
"coord_origin": "TOPLEFT"
},
"text": "JPEG",
"orig": "JPEG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 130.7,
"r_x1": 400.4,
"r_y1": 130.7,
"r_x2": 400.4,
"r_y2": 121.8,
"r_x3": 317.1,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined-Tabnet(*)",
"orig": "Combined-Tabnet(*)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 130.7,
"r_x1": 425.4,
"r_y1": 130.7,
"r_x2": 425.4,
"r_y2": 121.5,
"r_x3": 417.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 130.7,
"r_x1": 457.4,
"r_y1": 130.7,
"r_x2": 457.4,
"r_y2": 121.5,
"r_x3": 449.9,
"r_y3": 121.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 130.7,
"r_x1": 496.3,
"r_y1": 130.7,
"r_x2": 496.3,
"r_y2": 121.8,
"r_x3": 476.4,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "400k",
"orig": "400k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 130.7,
"r_x1": 532.6,
"r_y1": 130.7,
"r_x2": 532.6,
"r_y2": 121.8,
"r_x3": 512.6,
"r_y3": 121.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 142.7,
"r_x1": 375.2,
"r_y1": 142.7,
"r_x2": 375.2,
"r_y2": 133.8,
"r_x3": 317.1,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "Combined(**)",
"orig": "Combined(**)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 142.7,
"r_x1": 425.4,
"r_y1": 142.7,
"r_x2": 425.4,
"r_y2": 133.5,
"r_x3": 417.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 142.7,
"r_x1": 457.4,
"r_y1": 142.7,
"r_x2": 457.4,
"r_y2": 133.5,
"r_x3": 449.9,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 142.7,
"r_x1": 496.3,
"r_y1": 142.7,
"r_x2": 496.3,
"r_y2": 133.8,
"r_x3": 476.4,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "500k",
"orig": "500k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 142.7,
"r_x1": 532.6,
"r_y1": 142.7,
"r_x2": 532.6,
"r_y2": 133.8,
"r_x3": 512.6,
"r_y3": 133.8,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 317.1,
"r_y0": 154.6,
"r_x1": 369.4,
"r_y1": 154.6,
"r_x2": 369.4,
"r_y2": 145.7,
"r_x3": 317.1,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.9,
"r_y0": 154.7,
"r_x1": 425.4,
"r_y1": 154.7,
"r_x2": 425.4,
"r_y2": 145.4,
"r_x3": 417.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 154.7,
"r_x1": 457.4,
"r_y1": 154.7,
"r_x2": 457.4,
"r_y2": 145.4,
"r_x3": 449.9,
"r_y3": 145.4,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.4,
"r_y0": 154.6,
"r_x1": 496.3,
"r_y1": 154.6,
"r_x2": 496.3,
"r_y2": 145.7,
"r_x3": 476.4,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "600k",
"orig": "600k",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 512.6,
"r_y0": 154.6,
"r_x1": 532.6,
"r_y1": 154.6,
"r_x2": 532.6,
"r_y2": 145.7,
"r_x3": 512.6,
"r_y3": 145.7,
"coord_origin": "TOPLEFT"
},
"text": "PNG",
"orig": "PNG",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 412.3,
"t": 73.6,
"r": 430.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Tags",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 442.9,
"t": 73.6,
"r": 464.4,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Bbox",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 477.8,
"t": 73.6,
"r": 494.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "Size",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 508.3,
"t": 73.6,
"r": 536.9,
"b": 82.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "Format",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 86.0,
"r": 361.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "PubTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 85.7,
"r": 425.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 85.7,
"r": 457.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 86.0,
"r": 496.3,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "509k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 86.0,
"r": 532.6,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 97.9,
"r": 359.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "FinTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 97.6,
"r": 425.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 97.6,
"r": 457.4,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 97.9,
"r": 496.3,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "112k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.5,
"t": 97.9,
"r": 531.7,
"b": 106.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PDF",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 109.9,
"r": 360.0,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableBank",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 109.6,
"r": 425.4,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 450.8,
"t": 109.6,
"r": 456.5,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 109.9,
"r": 496.3,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "145k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 511.3,
"t": 109.9,
"r": 533.9,
"b": 118.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "JPEG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 121.8,
"r": 400.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined-Tabnet(*)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 121.5,
"r": 425.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 121.5,
"r": 457.4,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 121.8,
"r": 496.3,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "400k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 121.8,
"r": 532.6,
"b": 130.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 133.8,
"r": 375.2,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Combined(**)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 133.5,
"r": 425.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 133.5,
"r": 457.4,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 133.8,
"r": 496.3,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "500k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 133.8,
"r": 532.6,
"b": 142.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 317.1,
"t": 145.7,
"r": 369.4,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "SynthTabNet",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 417.9,
"t": 145.4,
"r": 425.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.9,
"t": 145.4,
"r": 457.4,
"b": 154.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 476.4,
"t": 145.7,
"r": 496.3,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "600k",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 512.6,
"t": 145.7,
"r": 532.6,
"b": 154.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PNG",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 9,
"page_no": 3,
"cluster": {
"id": 9,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 167.7,
"r": 545.1,
"b": 224.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 176.6,
"r_x1": 344.6,
"r_y1": 176.6,
"r_x2": 344.6,
"r_y2": 167.7,
"r_x3": 308.9,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Table 1:",
"orig": "Table 1:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 361.1,
"r_y0": 176.6,
"r_x1": 380.5,
"r_y1": 176.6,
"r_x2": 380.5,
"r_y2": 167.7,
"r_x3": 361.1,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "Both",
"orig": "Both",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.6,
"r_y0": 176.3,
"r_x1": 468.7,
"r_y1": 176.3,
"r_x2": 468.7,
"r_y2": 167.8,
"r_x3": 386.6,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201cCombined-Tabnet\u201d",
"orig": "\u201cCombined-Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 176.6,
"r_x1": 489.2,
"r_y1": 176.6,
"r_x2": 489.2,
"r_y2": 167.7,
"r_x3": 474.8,
"r_y3": 167.7,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.3,
"r_y0": 176.3,
"r_x1": 545.1,
"r_y1": 176.3,
"r_x2": 545.1,
"r_y2": 167.8,
"r_x3": 495.3,
"r_y3": 167.8,
"coord_origin": "TOPLEFT"
},
"text": "\u201dCombined-",
"orig": "\u201dCombined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 188.3,
"r_x1": 341.2,
"r_y1": 188.3,
"r_x2": 341.2,
"r_y2": 179.7,
"r_x3": 308.9,
"r_y3": 179.7,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet\u201d",
"orig": "Tabnet\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.5,
"r_y0": 188.5,
"r_x1": 545.1,
"r_y1": 188.5,
"r_x2": 545.1,
"r_y2": 179.6,
"r_x3": 343.5,
"r_y3": 179.6,
"coord_origin": "TOPLEFT"
},
"text": "are variations of the following: (*) The Combined-",
"orig": "are variations of the following: (*) The Combined-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 200.5,
"r_x1": 545.1,
"r_y1": 200.5,
"r_x2": 545.1,
"r_y2": 191.6,
"r_x3": 308.9,
"r_y3": 191.6,
"coord_origin": "TOPLEFT"
},
"text": "Tabnet dataset is the processed combination of PubTabNet",
"orig": "Tabnet dataset is the processed combination of PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 212.4,
"r_x1": 545.1,
"r_y1": 212.4,
"r_x2": 545.1,
"r_y2": 203.5,
"r_x3": 308.9,
"r_y3": 203.5,
"coord_origin": "TOPLEFT"
},
"text": "and Fintabnet. (**) The combined dataset is the processed",
"orig": "and Fintabnet. (**) The combined dataset is the processed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 224.4,
"r_x1": 523.9,
"r_y1": 224.4,
"r_x2": 523.9,
"r_y2": 215.5,
"r_x3": 308.9,
"r_y3": 215.5,
"coord_origin": "TOPLEFT"
},
"text": "combination of PubTabNet, Fintabnet and TableBank.",
"orig": "combination of PubTabNet, Fintabnet and TableBank.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 1: Both \"Combined-Tabnet\" and \"CombinedTabnet\" are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."
},
{
"label": "text",
"id": 6,
"page_no": 3,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 308.9,
"t": 249.6,
"r": 545.1,
"b": 294.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.5,
"r_x1": 545.1,
"r_y1": 258.5,
"r_x2": 545.1,
"r_y2": 249.6,
"r_x3": 308.9,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "one adopts a colorful appearance with high contrast and the",
"orig": "one adopts a colorful appearance with high contrast and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.5,
"r_x1": 545.1,
"r_y1": 270.5,
"r_x2": 545.1,
"r_y2": 261.6,
"r_x3": 308.9,
"r_y3": 261.6,
"coord_origin": "TOPLEFT"
},
"text": "last one contains tables with sparse content. Lastly, we have",
"orig": "last one contains tables with sparse content. Lastly, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.4,
"r_x1": 545.1,
"r_y1": 282.4,
"r_x2": 545.1,
"r_y2": 273.5,
"r_x3": 308.9,
"r_y3": 273.5,
"coord_origin": "TOPLEFT"
},
"text": "combined all synthetic datasets into one big unified syn-",
"orig": "combined all synthetic datasets into one big unified syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.4,
"r_x1": 436.8,
"r_y1": 294.4,
"r_x2": 436.8,
"r_y2": 285.5,
"r_x3": 308.9,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset of 600k examples.",
"orig": "thetic dataset of 600k examples.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."
},
{
"label": "text",
"id": 13,
"page_no": 3,
"cluster": {
"id": 13,
"label": "text",
"bbox": {
"l": 320.8,
"t": 297.8,
"r": 542.7,
"b": 306.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 306.7,
"r_x1": 542.7,
"r_y1": 306.7,
"r_x2": 542.7,
"r_y2": 297.8,
"r_x3": 320.8,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Tab. 1 summarizes the various attributes of the datasets.",
"orig": "Tab. 1 summarizes the various attributes of the datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Tab. 1 summarizes the various attributes of the datasets."
},
{
"label": "section_header",
"id": 11,
"page_no": 3,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 321.2,
"r": 444.9,
"b": 331.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 331.9,
"r_x1": 316.3,
"r_y1": 331.9,
"r_x2": 316.3,
"r_y2": 321.2,
"r_x3": 308.9,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.2,
"r_y0": 331.9,
"r_x1": 444.9,
"r_y1": 331.9,
"r_x2": 444.9,
"r_y2": 321.2,
"r_x3": 326.2,
"r_y3": 321.2,
"coord_origin": "TOPLEFT"
},
"text": "The TableFormer model",
"orig": "The TableFormer model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. The TableFormer model"
},
{
"label": "text",
"id": 0,
"page_no": 3,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 341.9,
"r": 545.1,
"b": 446.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 350.8,
"r_x1": 545.1,
"r_y1": 350.8,
"r_x2": 545.1,
"r_y2": 341.9,
"r_x3": 320.8,
"r_y3": 341.9,
"coord_origin": "TOPLEFT"
},
"text": "Given the image of a table, TableFormer is able to pre-",
"orig": "Given the image of a table, TableFormer is able to pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 362.8,
"r_x1": 545.1,
"r_y1": 362.8,
"r_x2": 545.1,
"r_y2": 353.9,
"r_x3": 308.9,
"r_y3": 353.9,
"coord_origin": "TOPLEFT"
},
"text": "dict: 1) a sequence of tokens that represent the structure of",
"orig": "dict: 1) a sequence of tokens that represent the structure of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 374.8,
"r_x1": 545.1,
"r_y1": 374.8,
"r_x2": 545.1,
"r_y2": 365.8,
"r_x3": 308.9,
"r_y3": 365.8,
"coord_origin": "TOPLEFT"
},
"text": "a table, and 2) a bounding box coupled to a subset of those",
"orig": "a table, and 2) a bounding box coupled to a subset of those",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 386.7,
"r_x1": 545.1,
"r_y1": 386.7,
"r_x2": 545.1,
"r_y2": 377.8,
"r_x3": 308.9,
"r_y3": 377.8,
"coord_origin": "TOPLEFT"
},
"text": "tokens. The conversion of an image into a sequence of to-",
"orig": "tokens. The conversion of an image into a sequence of to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 398.7,
"r_x1": 545.1,
"r_y1": 398.7,
"r_x2": 545.1,
"r_y2": 389.8,
"r_x3": 308.9,
"r_y3": 389.8,
"coord_origin": "TOPLEFT"
},
"text": "kens is a well-known task [35, 16]. While attention is often",
"orig": "kens is a well-known task [35, 16]. While attention is often",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 410.6,
"r_x1": 545.1,
"r_y1": 410.6,
"r_x2": 545.1,
"r_y2": 401.7,
"r_x3": 308.9,
"r_y3": 401.7,
"coord_origin": "TOPLEFT"
},
"text": "used as an implicit method to associate each token of the",
"orig": "used as an implicit method to associate each token of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 422.6,
"r_x1": 545.1,
"r_y1": 422.6,
"r_x2": 545.1,
"r_y2": 413.7,
"r_x3": 308.9,
"r_y3": 413.7,
"coord_origin": "TOPLEFT"
},
"text": "sequence with a position in the original image, an explicit",
"orig": "sequence with a position in the original image, an explicit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 434.5,
"r_x1": 545.1,
"r_y1": 434.5,
"r_x2": 545.1,
"r_y2": 425.6,
"r_x3": 308.9,
"r_y3": 425.6,
"coord_origin": "TOPLEFT"
},
"text": "association between the individual table-cells and the image",
"orig": "association between the individual table-cells and the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 446.5,
"r_x1": 437.9,
"r_y1": 446.5,
"r_x2": 437.9,
"r_y2": 437.6,
"r_x3": 308.9,
"r_y3": 437.6,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes is also required.",
"orig": "bounding boxes is also required.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."
},
{
"label": "section_header",
"id": 12,
"page_no": 3,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 457.7,
"r": 420.2,
"b": 467.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 467.5,
"r_x1": 323.1,
"r_y1": 467.5,
"r_x2": 323.1,
"r_y2": 457.7,
"r_x3": 308.9,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "4.1.",
"orig": "4.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 332.7,
"r_y0": 467.5,
"r_x1": 420.2,
"r_y1": 467.5,
"r_x2": 420.2,
"r_y2": 457.7,
"r_x3": 332.7,
"r_y3": 457.7,
"coord_origin": "TOPLEFT"
},
"text": "Model architecture.",
"orig": "Model architecture.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4.1. Model architecture."
},
{
"label": "text",
"id": 2,
"page_no": 3,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 476.8,
"r": 545.1,
"b": 665.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 485.7,
"r_x1": 545.1,
"r_y1": 485.7,
"r_x2": 545.1,
"r_y2": 476.8,
"r_x3": 320.8,
"r_y3": 476.8,
"coord_origin": "TOPLEFT"
},
"text": "We now describe in detail the proposed method, which",
"orig": "We now describe in detail the proposed method, which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.6,
"r_x1": 509.0,
"r_y1": 497.6,
"r_x2": 509.0,
"r_y2": 488.7,
"r_x3": 308.9,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "is composed of three main components, see Fig.",
"orig": "is composed of three main components, see Fig.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.6,
"r_y0": 497.6,
"r_x1": 523.1,
"r_y1": 497.6,
"r_x2": 523.1,
"r_y2": 488.7,
"r_x3": 515.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 497.6,
"r_x1": 545.1,
"r_y1": 497.6,
"r_x2": 545.1,
"r_y2": 488.7,
"r_x3": 529.6,
"r_y3": 488.7,
"coord_origin": "TOPLEFT"
},
"text": "Our",
"orig": "Our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.4,
"r_x1": 406.3,
"r_y1": 509.4,
"r_x2": 406.3,
"r_y2": 500.8,
"r_x3": 308.9,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.9,
"r_y0": 509.6,
"r_x1": 545.1,
"r_y1": 509.6,
"r_x2": 545.1,
"r_y2": 500.7,
"r_x3": 408.9,
"r_y3": 500.7,
"coord_origin": "TOPLEFT"
},
"text": "encodes the input as a feature vec-",
"orig": "encodes the input as a feature vec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.5,
"r_x1": 409.4,
"r_y1": 521.5,
"r_x2": 409.4,
"r_y2": 512.6,
"r_x3": 308.9,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "tor of predefined length.",
"orig": "tor of predefined length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 416.7,
"r_y0": 521.5,
"r_x1": 545.1,
"r_y1": 521.5,
"r_x2": 545.1,
"r_y2": 512.6,
"r_x3": 416.7,
"r_y3": 512.6,
"coord_origin": "TOPLEFT"
},
"text": "The input feature vector of the",
"orig": "The input feature vector of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.5,
"r_x1": 436.2,
"r_y1": 533.5,
"r_x2": 436.2,
"r_y2": 524.6,
"r_x3": 308.9,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "encoded image is passed to the",
"orig": "encoded image is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 533.3,
"r_x1": 513.9,
"r_y1": 533.3,
"r_x2": 513.9,
"r_y2": 524.7,
"r_x3": 439.5,
"r_y3": 524.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 517.4,
"r_y0": 533.5,
"r_x1": 545.1,
"r_y1": 533.5,
"r_x2": 545.1,
"r_y2": 524.6,
"r_x3": 517.4,
"r_y3": 524.6,
"coord_origin": "TOPLEFT"
},
"text": "to pro-",
"orig": "to pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.4,
"r_x1": 545.1,
"r_y1": 545.4,
"r_x2": 545.1,
"r_y2": 536.5,
"r_x3": 308.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "duce a sequence of HTML tags that represent the structure",
"orig": "duce a sequence of HTML tags that represent the structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.4,
"r_x1": 358.5,
"r_y1": 557.4,
"r_x2": 358.5,
"r_y2": 548.5,
"r_x3": 308.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "of the table.",
"orig": "of the table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 365.2,
"r_y0": 557.4,
"r_x1": 545.1,
"r_y1": 557.4,
"r_x2": 545.1,
"r_y2": 548.5,
"r_x3": 365.2,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "With each prediction of an HTML standard",
"orig": "With each prediction of an HTML standard",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.4,
"r_x1": 352.4,
"r_y1": 569.4,
"r_x2": 352.4,
"r_y2": 560.5,
"r_x3": 308.9,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell (\u2018",
"orig": "data cell (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.4,
"r_y0": 569.1,
"r_x1": 360.2,
"r_y1": 569.1,
"r_x2": 360.2,
"r_y2": 560.3,
"r_x3": 352.4,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 569.4,
"r_x1": 367.9,
"r_y1": 569.4,
"r_x2": 367.9,
"r_y2": 560.5,
"r_x3": 360.2,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.9,
"r_y0": 569.1,
"r_x1": 375.7,
"r_y1": 569.1,
"r_x2": 375.7,
"r_y2": 560.3,
"r_x3": 367.9,
"r_y3": 560.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 375.7,
"r_y0": 569.4,
"r_x1": 545.1,
"r_y1": 569.4,
"r_x2": 545.1,
"r_y2": 560.5,
"r_x3": 375.7,
"r_y3": 560.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) the hidden state of that cell is passed to",
"orig": "\u2019) the hidden state of that cell is passed to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.3,
"r_x1": 545.1,
"r_y1": 581.3,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 308.9,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "the Cell BBox Decoder. As for spanning cells, such as row",
"orig": "the Cell BBox Decoder. As for spanning cells, such as row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.3,
"r_x1": 483.1,
"r_y1": 593.3,
"r_x2": 483.1,
"r_y2": 584.4,
"r_x3": 308.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "or column span, the tag is broken down to \u2018",
"orig": "or column span, the tag is broken down to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 593.0,
"r_x1": 490.9,
"r_y1": 593.0,
"r_x2": 490.9,
"r_y2": 584.2,
"r_x3": 483.1,
"r_y3": 584.2,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.9,
"r_y0": 593.3,
"r_x1": 545.1,
"r_y1": 593.3,
"r_x2": 545.1,
"r_y2": 584.4,
"r_x3": 490.9,
"r_y3": 584.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018rowspan=\u2019",
"orig": "\u2019, \u2018rowspan=\u2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.2,
"r_x1": 545.1,
"r_y1": 605.2,
"r_x2": 545.1,
"r_y2": 596.3,
"r_x3": 308.9,
"r_y3": 596.3,
"coord_origin": "TOPLEFT"
},
"text": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"orig": "or \u2018colspan=\u2019, with the number of spanning cells (attribute),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.2,
"r_x1": 329.6,
"r_y1": 617.2,
"r_x2": 329.6,
"r_y2": 608.3,
"r_x3": 308.9,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "and \u2018",
"orig": "and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 329.6,
"r_y0": 617.0,
"r_x1": 337.4,
"r_y1": 617.0,
"r_x2": 337.4,
"r_y2": 608.1,
"r_x3": 329.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.4,
"r_y0": 617.2,
"r_x1": 468.6,
"r_y1": 617.2,
"r_x2": 468.6,
"r_y2": 608.3,
"r_x3": 337.4,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019. The hidden state attached to \u2018",
"orig": "\u2019. The hidden state attached to \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 617.0,
"r_x1": 476.3,
"r_y1": 617.0,
"r_x2": 476.3,
"r_y2": 608.1,
"r_x3": 468.6,
"r_y3": 608.1,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.3,
"r_y0": 617.2,
"r_x1": 545.1,
"r_y1": 617.2,
"r_x2": 545.1,
"r_y2": 608.3,
"r_x3": 476.3,
"r_y3": 608.3,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 is passed to the",
"orig": "\u2019 is passed to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.1,
"r_x1": 545.1,
"r_y1": 629.1,
"r_x2": 545.1,
"r_y2": 620.2,
"r_x3": 308.9,
"r_y3": 620.2,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder. A shared feed forward network (FFN)",
"orig": "Cell BBox Decoder. A shared feed forward network (FFN)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.1,
"r_x1": 545.1,
"r_y1": 641.1,
"r_x2": 545.1,
"r_y2": 632.2,
"r_x3": 308.9,
"r_y3": 632.2,
"coord_origin": "TOPLEFT"
},
"text": "receives the hidden states from the Structure Decoder, to",
"orig": "receives the hidden states from the Structure Decoder, to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.0,
"r_x1": 545.1,
"r_y1": 653.0,
"r_x2": 545.1,
"r_y2": 644.1,
"r_x3": 308.9,
"r_y3": 644.1,
"coord_origin": "TOPLEFT"
},
"text": "provide the final detection predictions of the bounding box",
"orig": "provide the final detection predictions of the bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.0,
"r_x1": 449.4,
"r_y1": 665.0,
"r_x2": 449.4,
"r_y2": 656.1,
"r_x3": 308.9,
"r_y3": 656.1,
"coord_origin": "TOPLEFT"
},
"text": "coordinates and their classification.",
"orig": "coordinates and their classification.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."
},
{
"label": "text",
"id": 7,
"page_no": 3,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 668.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 677.2,
"r_x1": 431.9,
"r_y1": 677.2,
"r_x2": 431.9,
"r_y2": 668.3,
"r_x3": 320.8,
"r_y3": 668.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network.",
"orig": "CNN Backbone Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.5,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 439.5,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "A ResNet-18 CNN is the",
"orig": "A ResNet-18 CNN is the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "backbone that receives the table image and encodes it as a",
"orig": "backbone that receives the table image and encodes it as a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "vector of predefined length. The network has been modified",
"orig": "vector of predefined length. The network has been modified",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "by removing the linear and pooling layer, as we are not per-",
"orig": "by removing the linear and pooling layer, as we are not per-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 3,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4"
}
]
}
},
{
"page_no": 4,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.7,
"r_y0": 125.6,
"r_x1": 84.9,
"r_y1": 125.6,
"r_x2": 84.9,
"r_y2": 122.4,
"r_x3": 81.7,
"r_y3": 122.4,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 125.6,
"r_x1": 93.0,
"r_y1": 125.6,
"r_x2": 93.0,
"r_y2": 122.4,
"r_x3": 86.5,
"r_y3": 122.4,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.5,
"r_y0": 118.4,
"r_x1": 115.3,
"r_y1": 118.4,
"r_x2": 115.3,
"r_y2": 115.3,
"r_x3": 102.5,
"r_y3": 115.3,
"coord_origin": "TOPLEFT"
},
"text": "Amount",
"orig": "Amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.1,
"r_y0": 118.4,
"r_x1": 93.3,
"r_y1": 118.4,
"r_x2": 93.3,
"r_y2": 115.2,
"r_x3": 82.1,
"r_y3": 115.2,
"coord_origin": "TOPLEFT"
},
"text": "Names",
"orig": "Names",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.7,
"r_y0": 125.6,
"r_x1": 104.3,
"r_y1": 125.6,
"r_x2": 104.3,
"r_y2": 122.4,
"r_x3": 96.7,
"r_y3": 122.4,
"coord_origin": "TOPLEFT"
},
"text": "1000",
"orig": "1000",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.7,
"r_y0": 130.9,
"r_x1": 102.4,
"r_y1": 130.9,
"r_x2": 102.4,
"r_y2": 127.7,
"r_x3": 96.7,
"r_y3": 127.7,
"coord_origin": "TOPLEFT"
},
"text": "500",
"orig": "500",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.7,
"r_y0": 136.6,
"r_x1": 104.3,
"r_y1": 136.6,
"r_x2": 104.3,
"r_y2": 133.5,
"r_x3": 96.7,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3500",
"orig": "3500",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 96.7,
"r_y0": 142.4,
"r_x1": 102.4,
"r_y1": 142.4,
"r_x2": 102.4,
"r_y2": 139.2,
"r_x3": 96.7,
"r_y3": 139.2,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 125.6,
"r_x1": 116.1,
"r_y1": 125.6,
"r_x2": 116.1,
"r_y2": 122.4,
"r_x3": 110.7,
"r_y3": 122.4,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 130.9,
"r_x1": 116.1,
"r_y1": 130.9,
"r_x2": 116.1,
"r_y2": 127.7,
"r_x3": 110.7,
"r_y3": 127.7,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 136.6,
"r_x1": 116.1,
"r_y1": 136.6,
"r_x2": 116.1,
"r_y2": 133.5,
"r_x3": 110.7,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 142.4,
"r_x1": 116.1,
"r_y1": 142.4,
"r_x2": 116.1,
"r_y2": 139.2,
"r_x3": 110.7,
"r_y3": 139.2,
"coord_origin": "TOPLEFT"
},
"text": "unit",
"orig": "unit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.7,
"r_y0": 130.9,
"r_x1": 84.9,
"r_y1": 130.9,
"r_x2": 84.9,
"r_y2": 127.7,
"r_x3": 81.7,
"r_y3": 127.7,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 130.9,
"r_x1": 93.0,
"r_y1": 130.9,
"r_x2": 93.0,
"r_y2": 127.7,
"r_x3": 86.5,
"r_y3": 127.7,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.7,
"r_y0": 136.6,
"r_x1": 84.9,
"r_y1": 136.6,
"r_x2": 84.9,
"r_y2": 133.5,
"r_x3": 81.7,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 136.6,
"r_x1": 93.0,
"r_y1": 136.6,
"r_x2": 93.0,
"r_y2": 133.5,
"r_x3": 86.5,
"r_y3": 133.5,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.7,
"r_y0": 142.4,
"r_x1": 84.9,
"r_y1": 142.4,
"r_x2": 84.9,
"r_y2": 139.2,
"r_x3": 81.7,
"r_y3": 139.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 142.4,
"r_x1": 93.0,
"r_y1": 142.4,
"r_x2": 93.0,
"r_y2": 139.2,
"r_x3": 86.5,
"r_y3": 139.2,
"coord_origin": "TOPLEFT"
},
"text": "Item",
"orig": "Item",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 96.2,
"r_x1": 113.9,
"r_y1": 96.2,
"r_x2": 113.9,
"r_y2": 90.5,
"r_x3": 88.1,
"r_y3": 90.5,
"coord_origin": "TOPLEFT"
},
"text": "Extracted",
"orig": "Extracted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.8,
"r_y0": 103.4,
"r_x1": 119.2,
"r_y1": 103.4,
"r_x2": 119.2,
"r_y2": 97.6,
"r_x3": 82.8,
"r_y3": 97.6,
"coord_origin": "TOPLEFT"
},
"text": "Table Images",
"orig": "Table Images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.9,
"r_y0": 106.3,
"r_x1": 180.0,
"r_y1": 106.3,
"r_x2": 180.0,
"r_y2": 100.6,
"r_x3": 143.9,
"r_y3": 100.6,
"coord_origin": "TOPLEFT"
},
"text": "Standardized",
"orig": "Standardized",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.9,
"r_y0": 113.5,
"r_x1": 172.0,
"r_y1": 113.5,
"r_x2": 172.0,
"r_y2": 107.7,
"r_x3": 151.9,
"r_y3": 107.7,
"coord_origin": "TOPLEFT"
},
"text": "Images",
"orig": "Images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.8,
"r_y0": 86.7,
"r_x1": 266.4,
"r_y1": 86.7,
"r_x2": 266.4,
"r_y2": 80.9,
"r_x3": 251.8,
"r_y3": 80.9,
"coord_origin": "TOPLEFT"
},
"text": "BBox",
"orig": "BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 247.5,
"r_y0": 91.8,
"r_x1": 270.7,
"r_y1": 91.8,
"r_x2": 270.7,
"r_y2": 86.0,
"r_x3": 247.5,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.0,
"r_y0": 84.3,
"r_x1": 352.1,
"r_y1": 84.3,
"r_x2": 352.1,
"r_y2": 78.6,
"r_x3": 331.0,
"r_y3": 78.6,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes",
"orig": "BBoxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 390.6,
"r_y0": 101.8,
"r_x1": 431.7,
"r_y1": 101.8,
"r_x2": 431.7,
"r_y2": 96.0,
"r_x3": 390.6,
"r_y3": 96.0,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes can be",
"orig": "BBoxes can be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 386.8,
"r_y0": 107.9,
"r_x1": 435.5,
"r_y1": 107.9,
"r_x2": 435.5,
"r_y2": 102.2,
"r_x3": 386.8,
"r_y3": 102.2,
"coord_origin": "TOPLEFT"
},
"text": "traced back to the",
"orig": "traced back to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 114.0,
"r_x1": 433.6,
"r_y1": 114.0,
"r_x2": 433.6,
"r_y2": 108.3,
"r_x3": 388.7,
"r_y3": 108.3,
"coord_origin": "TOPLEFT"
},
"text": "original image to",
"orig": "original image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.1,
"r_y0": 120.1,
"r_x1": 431.2,
"r_y1": 120.1,
"r_x2": 431.2,
"r_y2": 114.4,
"r_x3": 391.1,
"r_y3": 114.4,
"coord_origin": "TOPLEFT"
},
"text": "extract content",
"orig": "extract content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.2,
"r_y0": 157.4,
"r_x1": 498.8,
"r_y1": 157.4,
"r_x2": 498.8,
"r_y2": 151.7,
"r_x3": 431.2,
"r_y3": 151.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Tags sequence",
"orig": "Structure Tags sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.2,
"r_y0": 163.5,
"r_x1": 498.9,
"r_y1": 163.5,
"r_x2": 498.9,
"r_y2": 157.8,
"r_x3": 431.2,
"r_y3": 157.8,
"coord_origin": "TOPLEFT"
},
"text": "provide full description of",
"orig": "provide full description of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.5,
"r_y0": 169.7,
"r_x1": 489.5,
"r_y1": 169.7,
"r_x2": 489.5,
"r_y2": 163.9,
"r_x3": 440.5,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "the table structure",
"orig": "the table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.4,
"r_y0": 184.0,
"r_x1": 367.7,
"r_y1": 184.0,
"r_x2": 367.7,
"r_y2": 178.3,
"r_x3": 328.4,
"r_y3": 178.3,
"coord_origin": "TOPLEFT"
},
"text": "Structure Tags",
"orig": "Structure Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.8,
"r_y0": 129.6,
"r_x1": 373.7,
"r_y1": 129.6,
"r_x2": 373.7,
"r_y2": 123.9,
"r_x3": 331.8,
"r_y3": 123.9,
"coord_origin": "TOPLEFT"
},
"text": "BBoxes in sync",
"orig": "BBoxes in sync",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.8,
"r_y0": 134.7,
"r_x1": 381.2,
"r_y1": 134.7,
"r_x2": 381.2,
"r_y2": 129.0,
"r_x3": 331.8,
"r_y3": 129.0,
"coord_origin": "TOPLEFT"
},
"text": "with tag sequence",
"orig": "with tag sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.6,
"r_y0": 93.9,
"r_x1": 219.4,
"r_y1": 93.9,
"r_x2": 219.4,
"r_y2": 88.1,
"r_x3": 196.6,
"r_y3": 88.1,
"coord_origin": "TOPLEFT"
},
"text": "Encoder",
"orig": "Encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.7,
"r_y0": 135.2,
"r_x1": 271.5,
"r_y1": 135.2,
"r_x2": 271.5,
"r_y2": 129.5,
"r_x3": 246.7,
"r_y3": 129.5,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 247.5,
"r_y0": 140.3,
"r_x1": 270.7,
"r_y1": 140.3,
"r_x2": 270.7,
"r_y2": 134.6,
"r_x3": 247.5,
"r_y3": 134.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.6,
"r_y0": 94.8,
"r_x1": 365.6,
"r_y1": 94.8,
"r_x2": 365.6,
"r_y2": 89.0,
"r_x3": 330.6,
"r_y3": 89.0,
"coord_origin": "TOPLEFT"
},
"text": "[x1, y2, x2, y2]",
"orig": "[x1, y2, x2, y2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.6,
"r_y0": 102.9,
"r_x1": 370.2,
"r_y1": 102.9,
"r_x2": 370.2,
"r_y2": 97.2,
"r_x3": 330.6,
"r_y3": 97.2,
"coord_origin": "TOPLEFT"
},
"text": "[x1', y2', x2', y2']",
"orig": "[x1', y2', x2', y2']",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.6,
"r_y0": 111.1,
"r_x1": 374.5,
"r_y1": 111.1,
"r_x2": 374.5,
"r_y2": 105.3,
"r_x3": 330.6,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "[x1'', y2'', x2'', y2'']",
"orig": "[x1'', y2'', x2'', y2'']",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.6,
"r_y0": 119.2,
"r_x1": 335.7,
"r_y1": 119.2,
"r_x2": 335.7,
"r_y2": 113.5,
"r_x3": 330.6,
"r_y3": 113.5,
"coord_origin": "TOPLEFT"
},
"text": "...",
"orig": "...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.3,
"r_y0": 146.6,
"r_x1": 335.1,
"r_y1": 146.6,
"r_x2": 335.1,
"r_y2": 141.8,
"r_x3": 322.3,
"r_y3": 141.8,
"coord_origin": "TOPLEFT"
},
"text": "
",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 322.3,
"t": 163.2,
"r": 335.1,
"b": 168.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.3,
"r_y0": 168.0,
"r_x1": 335.1,
"r_y1": 168.0,
"r_x2": 335.1,
"r_y2": 163.2,
"r_x3": 322.3,
"r_y3": 163.2,
"coord_origin": "TOPLEFT"
},
"text": "",
"orig": " | ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 343.6,
"t": 163.2,
"r": 374.7,
"b": 168.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.6,
"r_y0": 168.0,
"r_x1": 374.7,
"r_y1": 168.0,
"r_x2": 374.7,
"r_y2": 163.2,
"r_x3": 343.6,
"r_y3": 163.2,
"coord_origin": "TOPLEFT"
},
"text": " | ...",
"orig": " | ...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 322.3,
"t": 170.4,
"r": 326.6,
"b": 175.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 322.3,
"r_y0": 175.1,
"r_x1": 326.6,
"r_y1": 175.1,
"r_x2": 326.6,
"r_y2": 170.4,
"r_x3": 322.3,
"r_y3": 170.4,
"coord_origin": "TOPLEFT"
},
"text": "...",
"orig": "...",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 323.5,
"t": 89.7,
"r": 326.9,
"b": 95.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.5,
"r_y0": 95.4,
"r_x1": 326.9,
"r_y1": 95.4,
"r_x2": 326.9,
"r_y2": 89.7,
"r_x3": 323.5,
"r_y3": 89.7,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 323.7,
"t": 97.8,
"r": 327.1,
"b": 103.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.7,
"r_y0": 103.5,
"r_x1": 327.1,
"r_y1": 103.5,
"r_x2": 327.1,
"r_y2": 97.8,
"r_x3": 323.7,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 323.7,
"t": 106.0,
"r": 327.1,
"b": 111.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 323.7,
"r_y0": 111.7,
"r_x1": 327.1,
"r_y1": 111.7,
"r_x2": 327.1,
"r_y2": 106.0,
"r_x3": 323.7,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 401.5,
"t": 148.5,
"r": 404.9,
"b": 154.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.5,
"r_y0": 154.3,
"r_x1": 404.9,
"r_y1": 154.3,
"r_x2": 404.9,
"r_y2": 148.5,
"r_x3": 401.5,
"r_y3": 148.5,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 337.7,
"t": 162.7,
"r": 341.1,
"b": 168.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 337.7,
"r_y0": 168.4,
"r_x1": 341.1,
"r_y1": 168.4,
"r_x2": 341.1,
"r_y2": 162.7,
"r_x3": 337.7,
"r_y3": 162.7,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 454.5,
"t": 104.5,
"r": 457.9,
"b": 110.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.5,
"r_y0": 110.3,
"r_x1": 457.9,
"r_y1": 110.3,
"r_x2": 457.9,
"r_y2": 104.5,
"r_x3": 454.5,
"r_y3": 104.5,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 493.3,
"t": 91.1,
"r": 496.7,
"b": 96.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.3,
"r_y0": 96.8,
"r_x1": 496.7,
"r_y1": 96.8,
"r_x2": 496.7,
"r_y2": 91.1,
"r_x3": 493.3,
"r_y3": 91.1,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 454.1,
"t": 90.6,
"r": 457.5,
"b": 96.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 96.3,
"r_x1": 457.5,
"r_y1": 96.3,
"r_x2": 457.5,
"r_y2": 90.6,
"r_x3": 454.1,
"r_y3": 90.6,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 6,
"page_no": 4,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 204.0,
"r": 545.1,
"b": 225.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 213.0,
"r_x1": 86.9,
"r_y1": 213.0,
"r_x2": 86.9,
"r_y2": 204.1,
"r_x3": 50.1,
"r_y3": 204.1,
"coord_origin": "TOPLEFT"
},
"text": "Figure 3:",
"orig": "Figure 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.0,
"r_y0": 212.9,
"r_x1": 149.9,
"r_y1": 212.9,
"r_x2": 149.9,
"r_y2": 204.0,
"r_x3": 94.0,
"r_y3": 204.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.9,
"r_y0": 213.0,
"r_x1": 545.1,
"r_y1": 213.0,
"r_x2": 545.1,
"r_y2": 204.1,
"r_x3": 152.9,
"r_y3": 204.1,
"coord_origin": "TOPLEFT"
},
"text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are",
"orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 225.0,
"r_x1": 436.0,
"r_y1": 225.0,
"r_x2": 436.0,
"r_y2": 216.1,
"r_x3": 50.1,
"r_y3": 216.1,
"coord_origin": "TOPLEFT"
},
"text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.",
"orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure."
},
{
"label": "picture",
"id": 5,
"page_no": 4,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 53.0,
"t": 257.7,
"r": 285.4,
"b": 507.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.3,
"r_y0": 264.2,
"r_x1": 101.8,
"r_y1": 264.2,
"r_x2": 101.8,
"r_y2": 258.2,
"r_x3": 74.3,
"r_y3": 258.2,
"coord_origin": "TOPLEFT"
},
"text": "Input Image",
"orig": "Input Image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.3,
"r_y0": 264.3,
"r_x1": 157.8,
"r_y1": 264.3,
"r_x2": 157.8,
"r_y2": 258.3,
"r_x3": 122.3,
"r_y3": 258.3,
"coord_origin": "TOPLEFT"
},
"text": "Tokenised Tags",
"orig": "Tokenised Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.5,
"r_y0": 377.0,
"r_x1": 125.7,
"r_y1": 377.0,
"r_x2": 125.7,
"r_y2": 371.4,
"r_x3": 78.5,
"r_y3": 371.4,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.5,
"r_y0": 397.0,
"r_x1": 84.6,
"r_y1": 397.0,
"r_x2": 84.6,
"r_y2": 391.3,
"r_x3": 78.5,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 397.0,
"r_x1": 125.1,
"r_y1": 397.0,
"r_x2": 125.1,
"r_y2": 391.3,
"r_x3": 116.5,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.0,
"r_y0": 430.1,
"r_x1": 127.9,
"r_y1": 430.1,
"r_x2": 127.9,
"r_y2": 424.5,
"r_x3": 76.0,
"r_y3": 424.5,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.4,
"r_y0": 450.6,
"r_x1": 84.5,
"r_y1": 450.6,
"r_x2": 84.5,
"r_y2": 444.9,
"r_x3": 78.4,
"r_y3": 444.9,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.4,
"r_y0": 450.6,
"r_x1": 125.0,
"r_y1": 450.6,
"r_x2": 125.0,
"r_y2": 444.9,
"r_x3": 116.4,
"r_y3": 444.9,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 167.5,
"r_y0": 468.1,
"r_x1": 181.6,
"r_y1": 468.1,
"r_x2": 181.6,
"r_y2": 462.4,
"r_x3": 167.5,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 165.6,
"r_y0": 484.1,
"r_x1": 184.4,
"r_y1": 484.1,
"r_x2": 184.4,
"r_y2": 478.5,
"r_x3": 165.6,
"r_y3": 478.5,
"coord_origin": "TOPLEFT"
},
"text": "Softmax",
"orig": "Softmax",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 330.2,
"r_x1": 132.9,
"r_y1": 330.2,
"r_x2": 132.9,
"r_y2": 324.3,
"r_x3": 65.3,
"r_y3": 324.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN BACKBONE ENCODER",
"orig": "CNN BACKBONE ENCODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.5,
"r_y0": 274.7,
"r_x1": 163.0,
"r_y1": 274.7,
"r_x2": 163.0,
"r_y2": 269.7,
"r_x3": 119.5,
"r_y3": 269.7,
"coord_origin": "TOPLEFT"
},
"text": "[30, 1, 2, 3, 4, \u2026 3, ",
"orig": "[30, 1, 2, 3, 4, \u2026 3, ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.7,
"r_y0": 280.0,
"r_x1": 151.4,
"r_y1": 280.0,
"r_x2": 151.4,
"r_y2": 274.9,
"r_x3": 128.7,
"r_y3": 274.9,
"coord_origin": "TOPLEFT"
},
"text": "4, 5, 8, 31]",
"orig": "4, 5, 8, 31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.4,
"r_y0": 344.3,
"r_x1": 80.3,
"r_y1": 344.3,
"r_x2": 80.3,
"r_y2": 339.0,
"r_x3": 60.4,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.6,
"r_y0": 348.7,
"r_x1": 78.9,
"r_y1": 348.7,
"r_x2": 78.9,
"r_y2": 343.4,
"r_x3": 60.6,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.8,
"r_y0": 298.7,
"r_x1": 154.7,
"r_y1": 298.7,
"r_x2": 154.7,
"r_y2": 293.4,
"r_x3": 134.8,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.0,
"r_y0": 303.1,
"r_x1": 153.2,
"r_y1": 303.1,
"r_x2": 153.2,
"r_y2": 297.8,
"r_x3": 135.0,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 351.0,
"r_x1": 197.1,
"r_y1": 351.0,
"r_x2": 197.1,
"r_y2": 345.4,
"r_x3": 150.6,
"r_y3": 345.4,
"coord_origin": "TOPLEFT"
},
"text": "Add & Normalisation",
"orig": "Add & Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 400.1,
"r_x1": 156.7,
"r_y1": 400.1,
"r_x2": 156.7,
"r_y2": 394.4,
"r_x3": 150.6,
"r_y3": 394.4,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.6,
"r_y0": 400.1,
"r_x1": 197.1,
"r_y1": 400.1,
"r_x2": 197.1,
"r_y2": 394.4,
"r_x3": 188.6,
"r_y3": 394.4,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.2,
"r_y0": 381.3,
"r_x1": 197.3,
"r_y1": 381.3,
"r_x2": 197.3,
"r_y2": 375.7,
"r_x3": 150.2,
"r_y3": 375.7,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 445.9,
"r_x1": 156.7,
"r_y1": 445.9,
"r_x2": 156.7,
"r_y2": 440.2,
"r_x3": 150.6,
"r_y3": 440.2,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.6,
"r_y0": 445.9,
"r_x1": 197.1,
"r_y1": 445.9,
"r_x2": 197.1,
"r_y2": 440.2,
"r_x3": 188.6,
"r_y3": 440.2,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.9,
"r_y0": 427.8,
"r_x1": 199.8,
"r_y1": 427.8,
"r_x2": 199.8,
"r_y2": 422.1,
"r_x3": 147.9,
"r_y3": 422.1,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.6,
"r_y0": 319.9,
"r_x1": 255.7,
"r_y1": 319.9,
"r_x2": 255.7,
"r_y2": 314.3,
"r_x3": 241.6,
"r_y3": 314.3,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.9,
"r_y0": 367.0,
"r_x1": 256.1,
"r_y1": 367.0,
"r_x2": 256.1,
"r_y2": 361.4,
"r_x3": 241.9,
"r_y3": 361.4,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.1,
"r_y0": 342.3,
"r_x1": 248.7,
"r_y1": 342.3,
"r_x2": 248.7,
"r_y2": 336.6,
"r_x3": 228.1,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 342.3,
"r_x1": 269.4,
"r_y1": 342.3,
"r_x2": 269.4,
"r_y2": 336.6,
"r_x3": 246.3,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "Network",
"orig": "Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.4,
"r_y0": 410.8,
"r_x1": 238.7,
"r_y1": 410.8,
"r_x2": 238.7,
"r_y2": 405.1,
"r_x3": 228.4,
"r_y3": 405.1,
"coord_origin": "TOPLEFT"
},
"text": "MLP",
"orig": "MLP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.3,
"r_y0": 410.9,
"r_x1": 271.8,
"r_y1": 410.9,
"r_x2": 271.8,
"r_y2": 405.2,
"r_x3": 256.3,
"r_y3": 405.2,
"coord_origin": "TOPLEFT"
},
"text": "Linear ",
"orig": "Linear ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.5,
"r_y0": 387.9,
"r_x1": 258.1,
"r_y1": 387.9,
"r_x2": 258.1,
"r_y2": 382.2,
"r_x3": 239.5,
"r_y3": 382.2,
"coord_origin": "TOPLEFT"
},
"text": "Sigmoid",
"orig": "Sigmoid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.1,
"r_y0": 449.8,
"r_x1": 59.5,
"r_y1": 449.8,
"r_x2": 59.5,
"r_y2": 384.9,
"r_x3": 54.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Encoder Network",
"orig": "Transformer Encoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.2,
"r_y0": 378.5,
"r_x1": 59.3,
"r_y1": 378.5,
"r_x2": 59.3,
"r_y2": 373.8,
"r_x3": 54.2,
"r_y3": 373.8,
"coord_origin": "TOPLEFT"
},
"text": "x2",
"orig": "x2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.3,
"r_y0": 490.4,
"r_x1": 122.2,
"r_y1": 490.4,
"r_x2": 122.2,
"r_y2": 484.5,
"r_x3": 85.3,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 285.5,
"r_x1": 265.3,
"r_y1": 285.5,
"r_x2": 265.3,
"r_y2": 279.5,
"r_x3": 229.7,
"r_y3": 279.5,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 506.1,
"r_x1": 190.4,
"r_y1": 506.1,
"r_x2": 190.4,
"r_y2": 500.3,
"r_x3": 157.2,
"r_y3": 500.3,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Tags",
"orig": "Predicted Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.8,
"r_y0": 443.9,
"r_x1": 270.8,
"r_y1": 443.9,
"r_x2": 270.8,
"r_y2": 438.1,
"r_x3": 227.8,
"r_y3": 438.1,
"coord_origin": "TOPLEFT"
},
"text": "Bounding Boxes & ",
"orig": "Bounding Boxes & ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.7,
"r_y0": 449.9,
"r_x1": 263.5,
"r_y1": 449.9,
"r_x2": 263.5,
"r_y2": 444.1,
"r_x3": 233.7,
"r_y3": 444.1,
"coord_origin": "TOPLEFT"
},
"text": "Classification",
"orig": "Classification",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.7,
"r_y0": 298.8,
"r_x1": 212.2,
"r_y1": 298.8,
"r_x2": 212.2,
"r_y2": 293.4,
"r_x3": 184.7,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Transformer ",
"orig": "Transformer ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.9,
"r_y0": 304.5,
"r_x1": 216.7,
"r_y1": 304.5,
"r_x2": 216.7,
"r_y2": 299.1,
"r_x3": 178.9,
"r_y3": 299.1,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Network",
"orig": "Decoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.2,
"r_y0": 287.8,
"r_x1": 198.9,
"r_y1": 287.8,
"r_x2": 198.9,
"r_y2": 282.8,
"r_x3": 194.2,
"r_y3": 282.8,
"coord_origin": "TOPLEFT"
},
"text": "x4",
"orig": "x4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.5,
"r_y0": 277.8,
"r_x1": 276.5,
"r_y1": 277.8,
"r_x2": 276.5,
"r_y2": 271.9,
"r_x3": 221.5,
"r_y3": 271.9,
"coord_origin": "TOPLEFT"
},
"text": "CELL BBOX DECODER",
"orig": "CELL BBOX DECODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.7,
"r_y0": 329.1,
"r_x1": 197.3,
"r_y1": 329.1,
"r_x2": 197.3,
"r_y2": 323.4,
"r_x3": 151.7,
"r_y3": 323.4,
"coord_origin": "TOPLEFT"
},
"text": "Masked Multi-Head ",
"orig": "Masked Multi-Head ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 163.4,
"r_y0": 335.1,
"r_x1": 184.2,
"r_y1": 335.1,
"r_x2": 184.2,
"r_y2": 329.4,
"r_x3": 163.4,
"r_y3": 329.4,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 70,
"label": "text",
"bbox": {
"l": 74.3,
"t": 258.2,
"r": 101.8,
"b": 264.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.3,
"r_y0": 264.2,
"r_x1": 101.8,
"r_y1": 264.2,
"r_x2": 101.8,
"r_y2": 258.2,
"r_x3": 74.3,
"r_y3": 258.2,
"coord_origin": "TOPLEFT"
},
"text": "Input Image",
"orig": "Input Image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 122.3,
"t": 258.3,
"r": 157.8,
"b": 264.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.3,
"r_y0": 264.3,
"r_x1": 157.8,
"r_y1": 264.3,
"r_x2": 157.8,
"r_y2": 258.3,
"r_x3": 122.3,
"r_y3": 258.3,
"coord_origin": "TOPLEFT"
},
"text": "Tokenised Tags",
"orig": "Tokenised Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 78.5,
"t": 371.4,
"r": 125.7,
"b": 377.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.5,
"r_y0": 377.0,
"r_x1": 125.7,
"r_y1": 377.0,
"r_x2": 125.7,
"r_y2": 371.4,
"r_x3": 78.5,
"r_y3": 371.4,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 78.5,
"t": 391.3,
"r": 84.6,
"b": 397.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.5,
"r_y0": 397.0,
"r_x1": 84.6,
"r_y1": 397.0,
"r_x2": 84.6,
"r_y2": 391.3,
"r_x3": 78.5,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 116.5,
"t": 391.3,
"r": 125.1,
"b": 397.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 397.0,
"r_x1": 125.1,
"r_y1": 397.0,
"r_x2": 125.1,
"r_y2": 391.3,
"r_x3": 116.5,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 76.0,
"t": 424.5,
"r": 127.9,
"b": 430.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.0,
"r_y0": 430.1,
"r_x1": 127.9,
"r_y1": 430.1,
"r_x2": 127.9,
"r_y2": 424.5,
"r_x3": 76.0,
"r_y3": 424.5,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 78.4,
"t": 444.9,
"r": 84.5,
"b": 450.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.4,
"r_y0": 450.6,
"r_x1": 84.5,
"r_y1": 450.6,
"r_x2": 84.5,
"r_y2": 444.9,
"r_x3": 78.4,
"r_y3": 444.9,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 116.4,
"t": 444.9,
"r": 125.0,
"b": 450.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.4,
"r_y0": 450.6,
"r_x1": 125.0,
"r_y1": 450.6,
"r_x2": 125.0,
"r_y2": 444.9,
"r_x3": 116.4,
"r_y3": 444.9,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 167.5,
"t": 462.4,
"r": 181.6,
"b": 468.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 167.5,
"r_y0": 468.1,
"r_x1": 181.6,
"r_y1": 468.1,
"r_x2": 181.6,
"r_y2": 462.4,
"r_x3": 167.5,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 165.6,
"t": 478.5,
"r": 184.4,
"b": 484.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 165.6,
"r_y0": 484.1,
"r_x1": 184.4,
"r_y1": 484.1,
"r_x2": 184.4,
"r_y2": 478.5,
"r_x3": 165.6,
"r_y3": 478.5,
"coord_origin": "TOPLEFT"
},
"text": "Softmax",
"orig": "Softmax",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 65.3,
"t": 324.3,
"r": 132.9,
"b": 330.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 330.2,
"r_x1": 132.9,
"r_y1": 330.2,
"r_x2": 132.9,
"r_y2": 324.3,
"r_x3": 65.3,
"r_y3": 324.3,
"coord_origin": "TOPLEFT"
},
"text": "CNN BACKBONE ENCODER",
"orig": "CNN BACKBONE ENCODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 119.5,
"t": 269.7,
"r": 163.0,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.5,
"r_y0": 274.7,
"r_x1": 163.0,
"r_y1": 274.7,
"r_x2": 163.0,
"r_y2": 269.7,
"r_x3": 119.5,
"r_y3": 269.7,
"coord_origin": "TOPLEFT"
},
"text": "[30, 1, 2, 3, 4, \u2026 3, ",
"orig": "[30, 1, 2, 3, 4, \u2026 3, ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 128.7,
"t": 274.9,
"r": 151.4,
"b": 280.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.7,
"r_y0": 280.0,
"r_x1": 151.4,
"r_y1": 280.0,
"r_x2": 151.4,
"r_y2": 274.9,
"r_x3": 128.7,
"r_y3": 274.9,
"coord_origin": "TOPLEFT"
},
"text": "4, 5, 8, 31]",
"orig": "4, 5, 8, 31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 60.4,
"t": 339.0,
"r": 80.3,
"b": 344.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.4,
"r_y0": 344.3,
"r_x1": 80.3,
"r_y1": 344.3,
"r_x2": 80.3,
"r_y2": 339.0,
"r_x3": 60.4,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 60.6,
"t": 343.4,
"r": 78.9,
"b": 348.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.6,
"r_y0": 348.7,
"r_x1": 78.9,
"r_y1": 348.7,
"r_x2": 78.9,
"r_y2": 343.4,
"r_x3": 60.6,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 134.8,
"t": 293.4,
"r": 154.7,
"b": 298.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.8,
"r_y0": 298.7,
"r_x1": 154.7,
"r_y1": 298.7,
"r_x2": 154.7,
"r_y2": 293.4,
"r_x3": 134.8,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Positional ",
"orig": "Positional ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 135.0,
"t": 297.8,
"r": 153.2,
"b": 303.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.0,
"r_y0": 303.1,
"r_x1": 153.2,
"r_y1": 303.1,
"r_x2": 153.2,
"r_y2": 297.8,
"r_x3": 135.0,
"r_y3": 297.8,
"coord_origin": "TOPLEFT"
},
"text": "Encoding",
"orig": "Encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 150.6,
"t": 345.4,
"r": 197.1,
"b": 351.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 351.0,
"r_x1": 197.1,
"r_y1": 351.0,
"r_x2": 197.1,
"r_y2": 345.4,
"r_x3": 150.6,
"r_y3": 345.4,
"coord_origin": "TOPLEFT"
},
"text": "Add & Normalisation",
"orig": "Add & Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 150.6,
"t": 394.4,
"r": 156.7,
"b": 400.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 400.1,
"r_x1": 156.7,
"r_y1": 400.1,
"r_x2": 156.7,
"r_y2": 394.4,
"r_x3": 150.6,
"r_y3": 394.4,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 188.6,
"t": 394.4,
"r": 197.1,
"b": 400.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.6,
"r_y0": 400.1,
"r_x1": 197.1,
"r_y1": 400.1,
"r_x2": 197.1,
"r_y2": 394.4,
"r_x3": 188.6,
"r_y3": 394.4,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 150.2,
"t": 375.7,
"r": 197.3,
"b": 381.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.2,
"r_y0": 381.3,
"r_x1": 197.3,
"r_y1": 381.3,
"r_x2": 197.3,
"r_y2": 375.7,
"r_x3": 150.2,
"r_y3": 375.7,
"coord_origin": "TOPLEFT"
},
"text": "Multi-Head Attention",
"orig": "Multi-Head Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 150.6,
"t": 440.2,
"r": 156.7,
"b": 445.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 150.6,
"r_y0": 445.9,
"r_x1": 156.7,
"r_y1": 445.9,
"r_x2": 156.7,
"r_y2": 440.2,
"r_x3": 150.6,
"r_y3": 440.2,
"coord_origin": "TOPLEFT"
},
"text": "Add",
"orig": "Add",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 188.6,
"t": 440.2,
"r": 197.1,
"b": 445.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.6,
"r_y0": 445.9,
"r_x1": 197.1,
"r_y1": 445.9,
"r_x2": 197.1,
"r_y2": 440.2,
"r_x3": 188.6,
"r_y3": 440.2,
"coord_origin": "TOPLEFT"
},
"text": "& Normalisation",
"orig": "& Normalisation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 147.9,
"t": 422.1,
"r": 199.8,
"b": 427.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.9,
"r_y0": 427.8,
"r_x1": 199.8,
"r_y1": 427.8,
"r_x2": 199.8,
"r_y2": 422.1,
"r_x3": 147.9,
"r_y3": 422.1,
"coord_origin": "TOPLEFT"
},
"text": "Feed Forward Network",
"orig": "Feed Forward Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 241.6,
"t": 314.3,
"r": 255.7,
"b": 319.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.6,
"r_y0": 319.9,
"r_x1": 255.7,
"r_y1": 319.9,
"r_x2": 255.7,
"r_y2": 314.3,
"r_x3": 241.6,
"r_y3": 314.3,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 241.9,
"t": 361.4,
"r": 256.1,
"b": 367.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.9,
"r_y0": 367.0,
"r_x1": 256.1,
"r_y1": 367.0,
"r_x2": 256.1,
"r_y2": 361.4,
"r_x3": 241.9,
"r_y3": 361.4,
"coord_origin": "TOPLEFT"
},
"text": "Linear",
"orig": "Linear",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 228.1,
"t": 336.6,
"r": 248.7,
"b": 342.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.1,
"r_y0": 342.3,
"r_x1": 248.7,
"r_y1": 342.3,
"r_x2": 248.7,
"r_y2": 336.6,
"r_x3": 228.1,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 246.3,
"t": 336.6,
"r": 269.4,
"b": 342.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 342.3,
"r_x1": 269.4,
"r_y1": 342.3,
"r_x2": 269.4,
"r_y2": 336.6,
"r_x3": 246.3,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "Network",
"orig": "Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 228.4,
"t": 405.1,
"r": 238.7,
"b": 410.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.4,
"r_y0": 410.8,
"r_x1": 238.7,
"r_y1": 410.8,
"r_x2": 238.7,
"r_y2": 405.1,
"r_x3": 228.4,
"r_y3": 405.1,
"coord_origin": "TOPLEFT"
},
"text": "MLP",
"orig": "MLP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 256.3,
"t": 405.2,
"r": 271.8,
"b": 410.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.3,
"r_y0": 410.9,
"r_x1": 271.8,
"r_y1": 410.9,
"r_x2": 271.8,
"r_y2": 405.2,
"r_x3": 256.3,
"r_y3": 405.2,
"coord_origin": "TOPLEFT"
},
"text": "Linear ",
"orig": "Linear ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 239.5,
"t": 382.2,
"r": 258.1,
"b": 387.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.5,
"r_y0": 387.9,
"r_x1": 258.1,
"r_y1": 387.9,
"r_x2": 258.1,
"r_y2": 382.2,
"r_x3": 239.5,
"r_y3": 382.2,
"coord_origin": "TOPLEFT"
},
"text": "Sigmoid",
"orig": "Sigmoid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 54.1,
"t": 384.9,
"r": 59.5,
"b": 449.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.1,
"r_y0": 449.8,
"r_x1": 59.5,
"r_y1": 449.8,
"r_x2": 59.5,
"r_y2": 384.9,
"r_x3": 54.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Encoder Network",
"orig": "Transformer Encoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 54.2,
"t": 373.8,
"r": 59.3,
"b": 378.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.2,
"r_y0": 378.5,
"r_x1": 59.3,
"r_y1": 378.5,
"r_x2": 59.3,
"r_y2": 373.8,
"r_x3": 54.2,
"r_y3": 373.8,
"coord_origin": "TOPLEFT"
},
"text": "x2",
"orig": "x2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 85.3,
"t": 484.5,
"r": 122.2,
"b": 490.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.3,
"r_y0": 490.4,
"r_x1": 122.2,
"r_y1": 490.4,
"r_x2": 122.2,
"r_y2": 484.5,
"r_x3": 85.3,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 229.7,
"t": 279.5,
"r": 265.3,
"b": 285.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 285.5,
"r_x1": 265.3,
"r_y1": 285.5,
"r_x2": 265.3,
"r_y2": 279.5,
"r_x3": 229.7,
"r_y3": 279.5,
"coord_origin": "TOPLEFT"
},
"text": "Encoded Output",
"orig": "Encoded Output",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 157.2,
"t": 500.3,
"r": 190.4,
"b": 506.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 506.1,
"r_x1": 190.4,
"r_y1": 506.1,
"r_x2": 190.4,
"r_y2": 500.3,
"r_x3": 157.2,
"r_y3": 500.3,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Tags",
"orig": "Predicted Tags",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 227.8,
"t": 438.1,
"r": 270.8,
"b": 443.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.8,
"r_y0": 443.9,
"r_x1": 270.8,
"r_y1": 443.9,
"r_x2": 270.8,
"r_y2": 438.1,
"r_x3": 227.8,
"r_y3": 438.1,
"coord_origin": "TOPLEFT"
},
"text": "Bounding Boxes & ",
"orig": "Bounding Boxes & ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 233.7,
"t": 444.1,
"r": 263.5,
"b": 449.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.7,
"r_y0": 449.9,
"r_x1": 263.5,
"r_y1": 449.9,
"r_x2": 263.5,
"r_y2": 444.1,
"r_x3": 233.7,
"r_y3": 444.1,
"coord_origin": "TOPLEFT"
},
"text": "Classification",
"orig": "Classification",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 184.7,
"t": 293.4,
"r": 212.2,
"b": 298.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.7,
"r_y0": 298.8,
"r_x1": 212.2,
"r_y1": 298.8,
"r_x2": 212.2,
"r_y2": 293.4,
"r_x3": 184.7,
"r_y3": 293.4,
"coord_origin": "TOPLEFT"
},
"text": "Transformer ",
"orig": "Transformer ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 178.9,
"t": 299.1,
"r": 216.7,
"b": 304.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.9,
"r_y0": 304.5,
"r_x1": 216.7,
"r_y1": 304.5,
"r_x2": 216.7,
"r_y2": 299.1,
"r_x3": 178.9,
"r_y3": 299.1,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Network",
"orig": "Decoder Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 194.2,
"t": 282.8,
"r": 198.9,
"b": 287.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 194.2,
"r_y0": 287.8,
"r_x1": 198.9,
"r_y1": 287.8,
"r_x2": 198.9,
"r_y2": 282.8,
"r_x3": 194.2,
"r_y3": 282.8,
"coord_origin": "TOPLEFT"
},
"text": "x4",
"orig": "x4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 221.5,
"t": 271.9,
"r": 276.5,
"b": 277.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.5,
"r_y0": 277.8,
"r_x1": 276.5,
"r_y1": 277.8,
"r_x2": 276.5,
"r_y2": 271.9,
"r_x3": 221.5,
"r_y3": 271.9,
"coord_origin": "TOPLEFT"
},
"text": "CELL BBOX DECODER",
"orig": "CELL BBOX DECODER",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 151.7,
"t": 323.4,
"r": 197.3,
"b": 329.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.7,
"r_y0": 329.1,
"r_x1": 197.3,
"r_y1": 329.1,
"r_x2": 197.3,
"r_y2": 323.4,
"r_x3": 151.7,
"r_y3": 323.4,
"coord_origin": "TOPLEFT"
},
"text": "Masked Multi-Head ",
"orig": "Masked Multi-Head ",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 163.4,
"t": 329.4,
"r": 184.2,
"b": 335.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 163.4,
"r_y0": 335.1,
"r_x1": 184.2,
"r_y1": 335.1,
"r_x2": 184.2,
"r_y2": 329.4,
"r_x3": 163.4,
"r_y3": 329.4,
"coord_origin": "TOPLEFT"
},
"text": "Attention",
"orig": "Attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 8,
"page_no": 4,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 527.8,
"r": 286.4,
"b": 680.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 536.8,
"r_x1": 229.8,
"r_y1": 536.8,
"r_x2": 229.8,
"r_y2": 527.9,
"r_x3": 50.1,
"r_y3": 527.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 4: Given an input image of a table, the",
"orig": "Figure 4: Given an input image of a table, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.8,
"r_y0": 536.7,
"r_x1": 267.8,
"r_y1": 536.7,
"r_x2": 267.8,
"r_y2": 527.8,
"r_x3": 231.8,
"r_y3": 527.8,
"coord_origin": "TOPLEFT"
},
"text": "Encoder",
"orig": "Encoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 269.8,
"r_y0": 536.8,
"r_x1": 286.4,
"r_y1": 536.8,
"r_x2": 286.4,
"r_y2": 527.9,
"r_x3": 269.8,
"r_y3": 527.9,
"coord_origin": "TOPLEFT"
},
"text": "pro-",
"orig": "pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 548.8,
"r_x1": 286.4,
"r_y1": 548.8,
"r_x2": 286.4,
"r_y2": 539.9,
"r_x3": 50.1,
"r_y3": 539.9,
"coord_origin": "TOPLEFT"
},
"text": "duces fixed-length features that represent the input image.",
"orig": "duces fixed-length features that represent the input image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 560.7,
"r_x1": 205.8,
"r_y1": 560.7,
"r_x2": 205.8,
"r_y2": 551.8,
"r_x3": 50.1,
"r_y3": 551.8,
"coord_origin": "TOPLEFT"
},
"text": "The features are then passed to both the",
"orig": "The features are then passed to both the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.0,
"r_y0": 560.7,
"r_x1": 286.4,
"r_y1": 560.7,
"r_x2": 286.4,
"r_y2": 551.7,
"r_x3": 208.0,
"r_y3": 551.7,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 572.7,
"r_x1": 64.5,
"r_y1": 572.7,
"r_x2": 64.5,
"r_y2": 563.8,
"r_x3": 50.1,
"r_y3": 563.8,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.2,
"r_y0": 572.6,
"r_x1": 151.3,
"r_y1": 572.6,
"r_x2": 151.3,
"r_y2": 563.6,
"r_x3": 68.2,
"r_y3": 563.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 151.3,
"r_y0": 572.7,
"r_x1": 153.8,
"r_y1": 572.7,
"r_x2": 153.8,
"r_y2": 563.8,
"r_x3": 151.3,
"r_y3": 563.8,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 572.7,
"r_x1": 241.9,
"r_y1": 572.7,
"r_x2": 241.9,
"r_y2": 563.8,
"r_x3": 160.4,
"r_y3": 563.8,
"coord_origin": "TOPLEFT"
},
"text": "During training, the",
"orig": "During training, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 572.6,
"r_x1": 286.4,
"r_y1": 572.6,
"r_x2": 286.4,
"r_y2": 563.6,
"r_x3": 245.6,
"r_y3": 563.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 584.6,
"r_x1": 85.5,
"r_y1": 584.6,
"r_x2": 85.5,
"r_y2": 575.6,
"r_x3": 50.1,
"r_y3": 575.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.6,
"r_y0": 584.6,
"r_x1": 286.4,
"r_y1": 584.6,
"r_x2": 286.4,
"r_y2": 575.7,
"r_x3": 88.6,
"r_y3": 575.7,
"coord_origin": "TOPLEFT"
},
"text": "receives \u2018tokenized tags\u2019 of the HTML code that",
"orig": "receives \u2018tokenized tags\u2019 of the HTML code that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 596.6,
"r_x1": 286.4,
"r_y1": 596.6,
"r_x2": 286.4,
"r_y2": 587.7,
"r_x3": 50.1,
"r_y3": 587.7,
"coord_origin": "TOPLEFT"
},
"text": "represent the table structure. Afterwards, a transformer en-",
"orig": "represent the table structure. Afterwards, a transformer en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 608.5,
"r_x1": 286.4,
"r_y1": 608.5,
"r_x2": 286.4,
"r_y2": 599.6,
"r_x3": 50.1,
"r_y3": 599.6,
"coord_origin": "TOPLEFT"
},
"text": "coder and decoder architecture is employed to produce fea-",
"orig": "coder and decoder architecture is employed to produce fea-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 620.5,
"r_x1": 240.4,
"r_y1": 620.5,
"r_x2": 240.4,
"r_y2": 611.6,
"r_x3": 50.1,
"r_y3": 611.6,
"coord_origin": "TOPLEFT"
},
"text": "tures that are received by a linear layer, and the",
"orig": "tures that are received by a linear layer, and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.2,
"r_y0": 620.4,
"r_x1": 286.4,
"r_y1": 620.4,
"r_x2": 286.4,
"r_y2": 611.5,
"r_x3": 243.2,
"r_y3": 611.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 632.4,
"r_x1": 286.4,
"r_y1": 632.4,
"r_x2": 286.4,
"r_y2": 623.4,
"r_x3": 50.1,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "Decoder. The linear layer is applied to the features to",
"orig": "Decoder. The linear layer is applied to the features to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 644.3,
"r_x1": 286.4,
"r_y1": 644.3,
"r_x2": 286.4,
"r_y2": 635.4,
"r_x3": 50.1,
"r_y3": 635.4,
"coord_origin": "TOPLEFT"
},
"text": "predict the tags. Simultaneously, the Cell BBox Decoder",
"orig": "predict the tags. Simultaneously, the Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 656.4,
"r_x1": 220.6,
"r_y1": 656.4,
"r_x2": 220.6,
"r_y2": 647.5,
"r_x3": 50.1,
"r_y3": 647.5,
"coord_origin": "TOPLEFT"
},
"text": "selects features referring to the data cells (\u2018",
"orig": "selects features referring to the data cells (\u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.6,
"r_y0": 656.1,
"r_x1": 228.3,
"r_y1": 656.1,
"r_x2": 228.3,
"r_y2": 647.3,
"r_x3": 220.6,
"r_y3": 647.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.3,
"r_y0": 656.4,
"r_x1": 236.1,
"r_y1": 656.4,
"r_x2": 236.1,
"r_y2": 647.5,
"r_x3": 228.3,
"r_y3": 647.5,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.1,
"r_y0": 656.1,
"r_x1": 243.8,
"r_y1": 656.1,
"r_x2": 243.8,
"r_y2": 647.3,
"r_x3": 236.1,
"r_y3": 647.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.8,
"r_y0": 656.4,
"r_x1": 255.3,
"r_y1": 656.4,
"r_x2": 255.3,
"r_y2": 647.5,
"r_x3": 243.8,
"r_y3": 647.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019, \u2018",
"orig": "\u2019, \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.3,
"r_y0": 656.1,
"r_x1": 263.0,
"r_y1": 656.1,
"r_x2": 263.0,
"r_y2": 647.3,
"r_x3": 255.3,
"r_y3": 647.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.0,
"r_y0": 656.4,
"r_x1": 286.4,
"r_y1": 656.4,
"r_x2": 286.4,
"r_y2": 647.5,
"r_x3": 263.0,
"r_y3": 647.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2019) and",
"orig": "\u2019) and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 668.3,
"r_x1": 286.4,
"r_y1": 668.3,
"r_x2": 286.4,
"r_y2": 659.4,
"r_x3": 50.1,
"r_y3": 659.4,
"coord_origin": "TOPLEFT"
},
"text": "passes them through an attention network, an MLP, and a",
"orig": "passes them through an attention network, an MLP, and a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 680.3,
"r_x1": 218.5,
"r_y1": 680.3,
"r_x2": 218.5,
"r_y2": 671.4,
"r_x3": 50.1,
"r_y3": 671.4,
"coord_origin": "TOPLEFT"
},
"text": "linear layer to predict the bounding boxes.",
"orig": "linear layer to predict the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes."
},
{
"label": "text",
"id": 4,
"page_no": 4,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 249.5,
"r": 545.1,
"b": 294.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 258.4,
"r_x1": 523.1,
"r_y1": 258.4,
"r_x2": 523.1,
"r_y2": 249.5,
"r_x3": 308.9,
"r_y3": 249.5,
"coord_origin": "TOPLEFT"
},
"text": "forming classification, and adding an adaptive pooling",
"orig": "forming classification, and adding an adaptive pooling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 525.2,
"r_y0": 258.4,
"r_x1": 545.1,
"r_y1": 258.4,
"r_x2": 545.1,
"r_y2": 249.5,
"r_x3": 525.2,
"r_y3": 249.5,
"coord_origin": "TOPLEFT"
},
"text": "layer",
"orig": "layer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 270.4,
"r_x1": 517.6,
"r_y1": 270.4,
"r_x2": 517.6,
"r_y2": 261.5,
"r_x3": 308.9,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "of size 28*28. ResNet by default downsamples the",
"orig": "of size 28*28. ResNet by default downsamples the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.8,
"r_y0": 270.4,
"r_x1": 545.1,
"r_y1": 270.4,
"r_x2": 545.1,
"r_y2": 261.5,
"r_x3": 520.8,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "image",
"orig": "image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 282.4,
"r_x1": 534.8,
"r_y1": 282.4,
"r_x2": 534.8,
"r_y2": 273.4,
"r_x3": 308.9,
"r_y3": 273.4,
"coord_origin": "TOPLEFT"
},
"text": "resolution by 32 and then the encoded image is provided",
"orig": "resolution by 32 and then the encoded image is provided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 537.4,
"r_y0": 282.4,
"r_x1": 545.1,
"r_y1": 282.4,
"r_x2": 545.1,
"r_y2": 273.4,
"r_x3": 537.4,
"r_y3": 273.4,
"coord_origin": "TOPLEFT"
},
"text": "to",
"orig": "to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 294.3,
"r_x1": 341.2,
"r_y1": 294.3,
"r_x2": 341.2,
"r_y2": 285.4,
"r_x3": 308.9,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": "both the",
"orig": "both the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.7,
"r_y0": 294.1,
"r_x1": 417.2,
"r_y1": 294.1,
"r_x2": 417.2,
"r_y2": 285.5,
"r_x3": 343.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 417.2,
"r_y0": 294.3,
"r_x1": 436.6,
"r_y1": 294.3,
"r_x2": 436.6,
"r_y2": 285.4,
"r_x3": 417.2,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 439.1,
"r_y0": 294.1,
"r_x1": 516.6,
"r_y1": 294.1,
"r_x2": 516.6,
"r_y2": 285.5,
"r_x3": 439.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.6,
"r_y0": 294.3,
"r_x1": 519.1,
"r_y1": 294.3,
"r_x2": 519.1,
"r_y2": 285.4,
"r_x3": 516.6,
"r_y3": 285.4,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ."
},
{
"label": "text",
"id": 1,
"page_no": 4,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 297.3,
"r": 545.1,
"b": 414.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 306.3,
"r_x1": 400.9,
"r_y1": 306.3,
"r_x2": 400.9,
"r_y2": 297.3,
"r_x3": 320.8,
"r_y3": 297.3,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder.",
"orig": "Structure Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.9,
"r_y0": 306.4,
"r_x1": 528.3,
"r_y1": 306.4,
"r_x2": 528.3,
"r_y2": 297.5,
"r_x3": 403.9,
"r_y3": 297.5,
"coord_origin": "TOPLEFT"
},
"text": "The transformer architecture of",
"orig": "The transformer architecture of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.7,
"r_y0": 306.4,
"r_x1": 545.1,
"r_y1": 306.4,
"r_x2": 545.1,
"r_y2": 297.5,
"r_x3": 530.7,
"r_y3": 297.5,
"coord_origin": "TOPLEFT"
},
"text": "this",
"orig": "this",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 318.3,
"r_x1": 517.5,
"r_y1": 318.3,
"r_x2": 517.5,
"r_y2": 309.4,
"r_x3": 308.9,
"r_y3": 309.4,
"coord_origin": "TOPLEFT"
},
"text": "component is based on the work proposed in [31].",
"orig": "component is based on the work proposed in [31].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.1,
"r_y0": 318.3,
"r_x1": 545.1,
"r_y1": 318.3,
"r_x2": 545.1,
"r_y2": 309.4,
"r_x3": 524.1,
"r_y3": 309.4,
"coord_origin": "TOPLEFT"
},
"text": "After",
"orig": "After",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 330.3,
"r_x1": 432.4,
"r_y1": 330.3,
"r_x2": 432.4,
"r_y2": 321.4,
"r_x3": 308.9,
"r_y3": 321.4,
"coord_origin": "TOPLEFT"
},
"text": "extensive experimentation, the",
"orig": "extensive experimentation, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.8,
"r_y0": 330.0,
"r_x1": 510.3,
"r_y1": 330.0,
"r_x2": 510.3,
"r_y2": 321.5,
"r_x3": 435.8,
"r_y3": 321.5,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.0,
"r_y0": 330.3,
"r_x1": 520.6,
"r_y1": 330.3,
"r_x2": 520.6,
"r_y2": 321.4,
"r_x3": 514.0,
"r_y3": 321.4,
"coord_origin": "TOPLEFT"
},
"text": "is",
"orig": "is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 524.1,
"r_y0": 330.3,
"r_x1": 545.1,
"r_y1": 330.3,
"r_x2": 545.1,
"r_y2": 321.4,
"r_x3": 524.1,
"r_y3": 321.4,
"coord_origin": "TOPLEFT"
},
"text": "mod-",
"orig": "mod-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 342.2,
"r_x1": 527.8,
"r_y1": 342.2,
"r_x2": 527.8,
"r_y2": 333.3,
"r_x3": 308.9,
"r_y3": 333.3,
"coord_origin": "TOPLEFT"
},
"text": "eled as a transformer encoder with two encoder layers",
"orig": "eled as a transformer encoder with two encoder layers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.7,
"r_y0": 342.2,
"r_x1": 545.1,
"r_y1": 342.2,
"r_x2": 545.1,
"r_y2": 333.3,
"r_x3": 530.7,
"r_y3": 333.3,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 354.2,
"r_x1": 526.9,
"r_y1": 354.2,
"r_x2": 526.9,
"r_y2": 345.3,
"r_x3": 308.9,
"r_y3": 345.3,
"coord_origin": "TOPLEFT"
},
"text": "a transformer decoder made from a stack of 4 decoder",
"orig": "a transformer decoder made from a stack of 4 decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 354.2,
"r_x1": 545.1,
"r_y1": 354.2,
"r_x2": 545.1,
"r_y2": 345.3,
"r_x3": 529.6,
"r_y3": 345.3,
"coord_origin": "TOPLEFT"
},
"text": "lay-",
"orig": "lay-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 366.1,
"r_x1": 524.5,
"r_y1": 366.1,
"r_x2": 524.5,
"r_y2": 357.2,
"r_x3": 308.9,
"r_y3": 357.2,
"coord_origin": "TOPLEFT"
},
"text": "ers that comprise mainly of multi-head attention and",
"orig": "ers that comprise mainly of multi-head attention and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 366.1,
"r_x1": 545.1,
"r_y1": 366.1,
"r_x2": 545.1,
"r_y2": 357.2,
"r_x3": 528.0,
"r_y3": 357.2,
"coord_origin": "TOPLEFT"
},
"text": "feed",
"orig": "feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 378.1,
"r_x1": 370.4,
"r_y1": 378.1,
"r_x2": 370.4,
"r_y2": 369.2,
"r_x3": 308.9,
"r_y3": 369.2,
"coord_origin": "TOPLEFT"
},
"text": "forward layers.",
"orig": "forward layers.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 377.4,
"r_y0": 378.1,
"r_x1": 526.9,
"r_y1": 378.1,
"r_x2": 526.9,
"r_y2": 369.2,
"r_x3": 377.4,
"r_y3": 369.2,
"coord_origin": "TOPLEFT"
},
"text": "This configuration uses fewer layers",
"orig": "This configuration uses fewer layers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 530.7,
"r_y0": 378.1,
"r_x1": 545.1,
"r_y1": 378.1,
"r_x2": 545.1,
"r_y2": 369.2,
"r_x3": 530.7,
"r_y3": 369.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 390.1,
"r_x1": 505.5,
"r_y1": 390.1,
"r_x2": 505.5,
"r_y2": 381.1,
"r_x3": 308.9,
"r_y3": 381.1,
"coord_origin": "TOPLEFT"
},
"text": "heads in comparison to networks applied to other",
"orig": "heads in comparison to networks applied to other",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.0,
"r_y0": 390.1,
"r_x1": 545.1,
"r_y1": 390.1,
"r_x2": 545.1,
"r_y2": 381.1,
"r_x3": 508.0,
"r_y3": 381.1,
"coord_origin": "TOPLEFT"
},
"text": "problems",
"orig": "problems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 402.0,
"r_x1": 517.7,
"r_y1": 402.0,
"r_x2": 517.7,
"r_y2": 393.1,
"r_x3": 308.9,
"r_y3": 393.1,
"coord_origin": "TOPLEFT"
},
"text": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),",
"orig": "(e.g. \u201cScene Understanding\u201d, \u201cImage Captioning\u201d),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.8,
"r_y0": 402.0,
"r_x1": 545.1,
"r_y1": 402.0,
"r_x2": 545.1,
"r_y2": 393.1,
"r_x3": 520.8,
"r_y3": 393.1,
"coord_origin": "TOPLEFT"
},
"text": "some-",
"orig": "some-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 414.0,
"r_x1": 528.0,
"r_y1": 414.0,
"r_x2": 528.0,
"r_y2": 405.1,
"r_x3": 308.9,
"r_y3": 405.1,
"coord_origin": "TOPLEFT"
},
"text": "thing which we relate to the simplicity of table images.",
"orig": "thing which we relate to the simplicity of table images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. \"Scene Understanding\", \"Image Captioning\"), something which we relate to the simplicity of table images."
},
{
"label": "text",
"id": 3,
"page_no": 4,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 417.1,
"r": 545.1,
"b": 545.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 426.0,
"r_x1": 515.5,
"r_y1": 426.0,
"r_x2": 515.5,
"r_y2": 417.1,
"r_x3": 320.8,
"r_y3": 417.1,
"coord_origin": "TOPLEFT"
},
"text": "The transformer encoder receives an encoded",
"orig": "The transformer encoder receives an encoded",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 520.8,
"r_y0": 426.0,
"r_x1": 545.1,
"r_y1": 426.0,
"r_x2": 545.1,
"r_y2": 417.1,
"r_x3": 520.8,
"r_y3": 417.1,
"coord_origin": "TOPLEFT"
},
"text": "image",
"orig": "image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 438.0,
"r_x1": 343.7,
"r_y1": 438.0,
"r_x2": 343.7,
"r_y2": 429.1,
"r_x3": 308.9,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "from the",
"orig": "from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 347.0,
"r_y0": 437.7,
"r_x1": 446.5,
"r_y1": 437.7,
"r_x2": 446.5,
"r_y2": 429.2,
"r_x3": 347.0,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.9,
"r_y0": 438.0,
"r_x1": 503.1,
"r_y1": 438.0,
"r_x2": 503.1,
"r_y2": 429.1,
"r_x3": 449.9,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "and refines it",
"orig": "and refines it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 506.4,
"r_y0": 438.0,
"r_x1": 537.4,
"r_y1": 438.0,
"r_x2": 537.4,
"r_y2": 429.1,
"r_x3": 506.4,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "through",
"orig": "through",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 540.7,
"r_y0": 438.0,
"r_x1": 545.1,
"r_y1": 438.0,
"r_x2": 545.1,
"r_y2": 429.1,
"r_x3": 540.7,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "a",
"orig": "a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 449.9,
"r_x1": 522.8,
"r_y1": 449.9,
"r_x2": 522.8,
"r_y2": 441.0,
"r_x3": 308.9,
"r_y3": 441.0,
"coord_origin": "TOPLEFT"
},
"text": "multi-head dot-product attention layer, followed by a",
"orig": "multi-head dot-product attention layer, followed by a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 525.7,
"r_y0": 449.9,
"r_x1": 545.1,
"r_y1": 449.9,
"r_x2": 545.1,
"r_y2": 441.0,
"r_x3": 525.7,
"r_y3": 441.0,
"coord_origin": "TOPLEFT"
},
"text": "Feed",
"orig": "Feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 461.9,
"r_x1": 384.1,
"r_y1": 461.9,
"r_x2": 384.1,
"r_y2": 453.0,
"r_x3": 308.9,
"r_y3": 453.0,
"coord_origin": "TOPLEFT"
},
"text": "Forward Network.",
"orig": "Forward Network.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.4,
"r_y0": 461.9,
"r_x1": 527.8,
"r_y1": 461.9,
"r_x2": 527.8,
"r_y2": 453.0,
"r_x3": 393.4,
"r_y3": 453.0,
"coord_origin": "TOPLEFT"
},
"text": "During training, the transformer",
"orig": "During training, the transformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.4,
"r_y0": 461.9,
"r_x1": 545.1,
"r_y1": 461.9,
"r_x2": 545.1,
"r_y2": 453.0,
"r_x3": 532.4,
"r_y3": 453.0,
"coord_origin": "TOPLEFT"
},
"text": "de-",
"orig": "de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 473.8,
"r_x1": 529.8,
"r_y1": 473.8,
"r_x2": 529.8,
"r_y2": 464.9,
"r_x3": 308.9,
"r_y3": 464.9,
"coord_origin": "TOPLEFT"
},
"text": "coder receives as input the output feature produced by",
"orig": "coder receives as input the output feature produced by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 532.9,
"r_y0": 473.8,
"r_x1": 545.1,
"r_y1": 473.8,
"r_x2": 545.1,
"r_y2": 464.9,
"r_x3": 532.9,
"r_y3": 464.9,
"coord_origin": "TOPLEFT"
},
"text": "the",
"orig": "the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 485.8,
"r_x1": 514.2,
"r_y1": 485.8,
"r_x2": 514.2,
"r_y2": 476.9,
"r_x3": 308.9,
"r_y3": 476.9,
"coord_origin": "TOPLEFT"
},
"text": "transformer encoder, and the tokenized input of the",
"orig": "transformer encoder, and the tokenized input of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 485.8,
"r_x1": 545.1,
"r_y1": 485.8,
"r_x2": 545.1,
"r_y2": 476.9,
"r_x3": 516.9,
"r_y3": 476.9,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.8,
"r_x1": 527.6,
"r_y1": 497.8,
"r_x2": 527.6,
"r_y2": 488.8,
"r_x3": 308.9,
"r_y3": 488.8,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth tags. Using a stack of multi-head attention",
"orig": "ground-truth tags. Using a stack of multi-head attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 529.6,
"r_y0": 497.8,
"r_x1": 545.1,
"r_y1": 497.8,
"r_x2": 545.1,
"r_y2": 488.8,
"r_x3": 529.6,
"r_y3": 488.8,
"coord_origin": "TOPLEFT"
},
"text": "lay-",
"orig": "lay-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 509.7,
"r_x1": 508.4,
"r_y1": 509.7,
"r_x2": 508.4,
"r_y2": 500.8,
"r_x3": 308.9,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "ers, different aspects of the tag sequence could be",
"orig": "ers, different aspects of the tag sequence could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.1,
"r_y0": 509.7,
"r_x1": 545.1,
"r_y1": 509.7,
"r_x2": 545.1,
"r_y2": 500.8,
"r_x3": 511.1,
"r_y3": 500.8,
"coord_origin": "TOPLEFT"
},
"text": "inferred.",
"orig": "inferred.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 521.7,
"r_x1": 545.1,
"r_y1": 521.7,
"r_x2": 545.1,
"r_y2": 512.8,
"r_x3": 308.9,
"r_y3": 512.8,
"coord_origin": "TOPLEFT"
},
"text": "This is achieved by each attention head on a layer operating",
"orig": "This is achieved by each attention head on a layer operating",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.6,
"r_x1": 545.1,
"r_y1": 533.6,
"r_x2": 545.1,
"r_y2": 524.7,
"r_x3": 308.9,
"r_y3": 524.7,
"coord_origin": "TOPLEFT"
},
"text": "in a different subspace, and then combining altogether their",
"orig": "in a different subspace, and then combining altogether their",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.6,
"r_x1": 369.7,
"r_y1": 545.6,
"r_x2": 369.7,
"r_y2": 536.7,
"r_x3": 308.9,
"r_y3": 536.7,
"coord_origin": "TOPLEFT"
},
"text": "attention score.",
"orig": "attention score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score."
},
{
"label": "text",
"id": 0,
"page_no": 4,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 548.6,
"r": 545.1,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 557.6,
"r_x1": 404.8,
"r_y1": 557.6,
"r_x2": 404.8,
"r_y2": 548.6,
"r_x3": 320.8,
"r_y3": 548.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder.",
"orig": "Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.3,
"r_y0": 557.6,
"r_x1": 545.1,
"r_y1": 557.6,
"r_x2": 545.1,
"r_y2": 548.7,
"r_x3": 410.3,
"r_y3": 548.7,
"coord_origin": "TOPLEFT"
},
"text": "Our architecture allows to simul-",
"orig": "Our architecture allows to simul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.6,
"r_x1": 545.1,
"r_y1": 569.6,
"r_x2": 545.1,
"r_y2": 560.7,
"r_x3": 308.9,
"r_y3": 560.7,
"coord_origin": "TOPLEFT"
},
"text": "taneously predict HTML tags and bounding boxes for each",
"orig": "taneously predict HTML tags and bounding boxes for each",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.5,
"r_x1": 545.1,
"r_y1": 581.5,
"r_x2": 545.1,
"r_y2": 572.6,
"r_x3": 308.9,
"r_y3": 572.6,
"coord_origin": "TOPLEFT"
},
"text": "table cell without the need of a separate object detector end",
"orig": "table cell without the need of a separate object detector end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.5,
"r_x1": 545.1,
"r_y1": 593.5,
"r_x2": 545.1,
"r_y2": 584.6,
"r_x3": 308.9,
"r_y3": 584.6,
"coord_origin": "TOPLEFT"
},
"text": "to end. This approach is inspired by DETR [1] which em-",
"orig": "to end. This approach is inspired by DETR [1] which em-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.5,
"r_x1": 545.1,
"r_y1": 605.5,
"r_x2": 545.1,
"r_y2": 596.5,
"r_x3": 308.9,
"r_y3": 596.5,
"coord_origin": "TOPLEFT"
},
"text": "ploys a Transformer Encoder, and Decoder that looks for",
"orig": "ploys a Transformer Encoder, and Decoder that looks for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.4,
"r_x1": 545.1,
"r_y1": 617.4,
"r_x2": 545.1,
"r_y2": 608.5,
"r_x3": 308.9,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "a specific number of object queries (potential object detec-",
"orig": "a specific number of object queries (potential object detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.4,
"r_x1": 545.1,
"r_y1": 629.4,
"r_x2": 545.1,
"r_y2": 620.5,
"r_x3": 308.9,
"r_y3": 620.5,
"coord_origin": "TOPLEFT"
},
"text": "tions). As our model utilizes a transformer architecture, the",
"orig": "tions). As our model utilizes a transformer architecture, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.3,
"r_x1": 381.7,
"r_y1": 641.3,
"r_x2": 381.7,
"r_y2": 632.4,
"r_x3": 308.9,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "hidden state of the",
"orig": "hidden state of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.0,
"r_y0": 641.1,
"r_x1": 391.7,
"r_y1": 641.1,
"r_x2": 391.7,
"r_y2": 632.3,
"r_x3": 384.0,
"r_y3": 632.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.7,
"r_y0": 641.3,
"r_x1": 399.5,
"r_y1": 641.3,
"r_x2": 399.5,
"r_y2": 632.4,
"r_x3": 391.7,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "td",
"orig": "td",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 399.5,
"r_y0": 641.1,
"r_x1": 407.2,
"r_y1": 641.1,
"r_x2": 407.2,
"r_y2": 632.3,
"r_x3": 399.5,
"r_y3": 632.3,
"coord_origin": "TOPLEFT"
},
"text": ">",
"orig": ">",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 407.2,
"r_y0": 641.3,
"r_x1": 432.9,
"r_y1": 641.3,
"r_x2": 432.9,
"r_y2": 632.4,
"r_x3": 407.2,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 and \u2018",
"orig": "\u2019 and \u2018",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 432.9,
"r_y0": 641.1,
"r_x1": 440.7,
"r_y1": 641.1,
"r_x2": 440.7,
"r_y2": 632.3,
"r_x3": 432.9,
"r_y3": 632.3,
"coord_origin": "TOPLEFT"
},
"text": "<",
"orig": "<",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.7,
"r_y0": 641.3,
"r_x1": 545.1,
"r_y1": 641.3,
"r_x2": 545.1,
"r_y2": 632.4,
"r_x3": 440.7,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "\u2019 HTML structure tags be-",
"orig": "\u2019 HTML structure tags be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.3,
"r_x1": 399.0,
"r_y1": 653.3,
"r_x2": 399.0,
"r_y2": 644.4,
"r_x3": 308.9,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "come the object query.",
"orig": "come the object query.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTML structure tags become the object query."
},
{
"label": "text",
"id": 2,
"page_no": 4,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 656.4,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 665.3,
"r_x1": 444.3,
"r_y1": 665.3,
"r_x2": 444.3,
"r_y2": 656.4,
"r_x3": 320.8,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "The encoding generated by the",
"orig": "The encoding generated by the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 447.0,
"r_y0": 665.1,
"r_x1": 545.1,
"r_y1": 665.1,
"r_x2": 545.1,
"r_y2": 656.5,
"r_x3": 447.0,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.3,
"r_x1": 545.1,
"r_y1": 677.3,
"r_x2": 545.1,
"r_y2": 668.4,
"r_x3": 308.9,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "along with the features acquired for every data cell from the",
"orig": "along with the features acquired for every data cell from the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 308.9,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder are then passed to the attention net-",
"orig": "Transformer Decoder are then passed to the attention net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "work. The attention network takes both inputs and learns to",
"orig": "work. The attention network takes both inputs and learns to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "provide an attention weighted encoding. This weighted at-",
"orig": "provide an attention weighted encoding. This weighted at-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-"
}
],
"headers": [
{
"label": "page_footer",
"id": 9,
"page_no": 4,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5"
}
]
}
},
{
"page_no": 5,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 286.4,
"r_y1": 108.0,
"r_x2": 286.4,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.9,
"r_x1": 286.4,
"r_y1": 131.9,
"r_x2": 286.4,
"r_y2": 123.0,
"r_x3": 50.1,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.8,
"r_x1": 175.2,
"r_y1": 155.8,
"r_x2": 175.2,
"r_y2": 146.9,
"r_x3": 50.1,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 168.5,
"r_x1": 286.4,
"r_y1": 168.5,
"r_x2": 286.4,
"r_y2": 159.6,
"r_x3": 62.1,
"r_y3": 159.6,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.5,
"r_x1": 286.4,
"r_y1": 180.5,
"r_x2": 286.4,
"r_y2": 171.6,
"r_x3": 50.1,
"r_y3": 171.6,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.4,
"r_x1": 286.4,
"r_y1": 192.4,
"r_x2": 286.4,
"r_y2": 183.5,
"r_x3": 50.1,
"r_y3": 183.5,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.4,
"r_x1": 286.4,
"r_y1": 204.4,
"r_x2": 286.4,
"r_y2": 195.5,
"r_x3": 50.1,
"r_y3": 195.5,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.4,
"r_x1": 286.4,
"r_y1": 216.4,
"r_x2": 286.4,
"r_y2": 207.4,
"r_x3": 50.1,
"r_y3": 207.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.3,
"r_x1": 286.4,
"r_y1": 228.3,
"r_x2": 286.4,
"r_y2": 219.4,
"r_x3": 50.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 240.3,
"r_x1": 181.5,
"r_y1": 240.3,
"r_x2": 181.5,
"r_y2": 231.4,
"r_x3": 50.1,
"r_y3": 231.4,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.9,
"r_x1": 129.2,
"r_y1": 252.9,
"r_x2": 129.2,
"r_y2": 243.9,
"r_x3": 62.1,
"r_y3": 243.9,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.5,
"r_y0": 252.9,
"r_x1": 286.4,
"r_y1": 252.9,
"r_x2": 286.4,
"r_y2": 244.0,
"r_x3": 134.5,
"r_y3": 244.0,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.9,
"r_x1": 286.4,
"r_y1": 264.9,
"r_x2": 286.4,
"r_y2": 256.0,
"r_x3": 50.1,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 56.8,
"r_y1": 276.6,
"r_x2": 56.8,
"r_y2": 267.8,
"r_x3": 50.1,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.3,
"r_y0": 276.9,
"r_x1": 135.4,
"r_y1": 276.9,
"r_x2": 135.4,
"r_y2": 268.0,
"r_x3": 57.3,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.7,
"r_y0": 276.6,
"r_x1": 211.1,
"r_y1": 276.6,
"r_x2": 211.1,
"r_y2": 268.0,
"r_x3": 137.7,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.6,
"r_y0": 276.9,
"r_x1": 286.4,
"r_y1": 276.9,
"r_x2": 286.4,
"r_y2": 268.0,
"r_x3": 213.6,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.8,
"r_x1": 158.8,
"r_y1": 288.8,
"r_x2": 158.8,
"r_y2": 279.9,
"r_x3": 50.1,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.3,
"r_y0": 288.6,
"r_x1": 238.8,
"r_y1": 288.6,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.3,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.5,
"r_y0": 288.8,
"r_x1": 286.4,
"r_y1": 288.8,
"r_x2": 286.4,
"r_y2": 279.9,
"r_x3": 241.5,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.8,
"r_x1": 211.4,
"r_y1": 300.8,
"r_x2": 211.4,
"r_y2": 291.9,
"r_x3": 50.1,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.3,
"r_y0": 300.5,
"r_x1": 229.2,
"r_y1": 300.5,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.3,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.8,
"r_x1": 232.2,
"r_y1": 300.8,
"r_x2": 232.2,
"r_y2": 291.9,
"r_x3": 229.7,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.5,
"r_y0": 300.5,
"r_x1": 251.4,
"r_y1": 300.5,
"r_x2": 251.4,
"r_y2": 291.7,
"r_x3": 236.5,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.8,
"r_y0": 300.8,
"r_x1": 286.4,
"r_y1": 300.8,
"r_x2": 286.4,
"r_y2": 291.9,
"r_x3": 254.8,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.7,
"r_x1": 137.5,
"r_y1": 312.7,
"r_x2": 137.5,
"r_y2": 303.8,
"r_x3": 50.1,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.2,
"r_y1": 312.5,
"r_x2": 148.2,
"r_y2": 303.7,
"r_x3": 141.3,
"r_y3": 303.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.6,
"r_y0": 312.7,
"r_x1": 286.4,
"r_y1": 312.7,
"r_x2": 286.4,
"r_y2": 303.8,
"r_x3": 152.6,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.7,
"r_x1": 89.7,
"r_y1": 324.7,
"r_x2": 89.7,
"r_y2": 315.8,
"r_x3": 50.1,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.7,
"r_y0": 324.5,
"r_x1": 104.1,
"r_y1": 324.5,
"r_x2": 104.1,
"r_y2": 315.6,
"r_x3": 89.7,
"r_y3": 315.6,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.6,
"r_y0": 324.7,
"r_x1": 286.4,
"r_y1": 324.7,
"r_x2": 286.4,
"r_y2": 315.8,
"r_x3": 104.6,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.6,
"r_x1": 286.4,
"r_y1": 336.6,
"r_x2": 286.4,
"r_y2": 327.7,
"r_x3": 50.1,
"r_y3": 327.7,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.6,
"r_x1": 286.4,
"r_y1": 348.6,
"r_x2": 286.4,
"r_y2": 339.7,
"r_x3": 50.1,
"r_y3": 339.7,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.5,
"r_x1": 286.4,
"r_y1": 360.5,
"r_x2": 286.4,
"r_y2": 351.6,
"r_x3": 50.1,
"r_y3": 351.6,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.5,
"r_x1": 286.4,
"r_y1": 372.5,
"r_x2": 286.4,
"r_y2": 363.6,
"r_x3": 50.1,
"r_y3": 363.6,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.5,
"r_x1": 286.4,
"r_y1": 384.5,
"r_x2": 286.4,
"r_y2": 375.5,
"r_x3": 50.1,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.4,
"r_x1": 286.4,
"r_y1": 396.4,
"r_x2": 286.4,
"r_y2": 387.5,
"r_x3": 50.1,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.4,
"r_x1": 88.7,
"r_y1": 408.4,
"r_x2": 88.7,
"r_y2": 399.5,
"r_x3": 50.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.6,
"r_y0": 408.1,
"r_x1": 170.1,
"r_y1": 408.1,
"r_x2": 170.1,
"r_y2": 399.5,
"r_x3": 91.6,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.1,
"r_y0": 408.4,
"r_x1": 286.4,
"r_y1": 408.4,
"r_x2": 286.4,
"r_y2": 399.5,
"r_x3": 170.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.3,
"r_x1": 182.0,
"r_y1": 420.3,
"r_x2": 182.0,
"r_y2": 411.4,
"r_x3": 50.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.1,
"r_y0": 420.3,
"r_x1": 197.7,
"r_y1": 420.3,
"r_x2": 197.7,
"r_y2": 411.4,
"r_x3": 189.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 420.3,
"r_x1": 286.4,
"r_y1": 420.3,
"r_x2": 286.4,
"r_y2": 411.4,
"r_x3": 200.3,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.3,
"r_x1": 286.4,
"r_y1": 432.3,
"r_x2": 286.4,
"r_y2": 423.4,
"r_x3": 50.1,
"r_y3": 423.4,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 158.3,
"r_y1": 444.2,
"r_x2": 158.3,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 456.9,
"r_x1": 286.4,
"r_y1": 456.9,
"r_x2": 286.4,
"r_y2": 448.0,
"r_x3": 62.1,
"r_y3": 448.0,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 468.9,
"r_x1": 91.4,
"r_y1": 468.9,
"r_x2": 91.4,
"r_y2": 460.0,
"r_x3": 50.1,
"r_y3": 460.0,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.7,
"r_y0": 502.1,
"r_x1": 140.6,
"r_y1": 502.1,
"r_x2": 140.6,
"r_y2": 493.3,
"r_x3": 125.7,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.9,
"r_y0": 502.1,
"r_x1": 151.7,
"r_y1": 502.1,
"r_x2": 151.7,
"r_y2": 493.3,
"r_x3": 143.9,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.4,
"r_y0": 502.1,
"r_x1": 186.6,
"r_y1": 502.1,
"r_x2": 186.6,
"r_y2": 493.3,
"r_x3": 154.4,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.3,
"r_y0": 502.1,
"r_x1": 197.1,
"r_y1": 502.1,
"r_x2": 197.1,
"r_y2": 493.3,
"r_x3": 189.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.1,
"r_x1": 211.6,
"r_y1": 502.1,
"r_x2": 211.6,
"r_y2": 493.3,
"r_x3": 199.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.3,
"r_y0": 517.1,
"r_x1": 127.3,
"r_y1": 517.1,
"r_x2": 127.3,
"r_y2": 508.2,
"r_x3": 124.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.3,
"r_y0": 517.1,
"r_x1": 138.0,
"r_y1": 517.1,
"r_x2": 138.0,
"r_y2": 508.2,
"r_x3": 130.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.8,
"r_y0": 517.1,
"r_x1": 153.3,
"r_y1": 517.1,
"r_x2": 153.3,
"r_y2": 508.2,
"r_x3": 140.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 517.1,
"r_x1": 174.9,
"r_y1": 517.1,
"r_x2": 174.9,
"r_y2": 508.2,
"r_x3": 156.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.1,
"r_y0": 517.1,
"r_x1": 184.8,
"r_y1": 517.1,
"r_x2": 184.8,
"r_y2": 507.7,
"r_x3": 177.1,
"r_y3": 507.7,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 517.1,
"r_x1": 192.8,
"r_y1": 517.1,
"r_x2": 192.8,
"r_y2": 508.2,
"r_x3": 187.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.8,
"r_y0": 517.1,
"r_x1": 196.7,
"r_y1": 517.1,
"r_x2": 196.7,
"r_y2": 508.2,
"r_x3": 192.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.7,
"r_y0": 517.1,
"r_x1": 211.6,
"r_y1": 517.1,
"r_x2": 211.6,
"r_y2": 508.2,
"r_x3": 196.7,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 509.9,
"r_x1": 286.4,
"r_y1": 509.9,
"r_x2": 286.4,
"r_y2": 501.0,
"r_x3": 274.7,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 540.2,
"r_x1": 74.5,
"r_y1": 540.2,
"r_x2": 74.5,
"r_y2": 531.3,
"r_x3": 50.1,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 540.0,
"r_x1": 82.8,
"r_y1": 540.0,
"r_x2": 82.8,
"r_y2": 531.1,
"r_x3": 76.9,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.5,
"r_y0": 540.0,
"r_x1": 92.2,
"r_y1": 540.0,
"r_x2": 92.2,
"r_y2": 530.6,
"r_x3": 85.5,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.7,
"r_y0": 540.2,
"r_x1": 135.6,
"r_y1": 540.2,
"r_x2": 135.6,
"r_y2": 531.3,
"r_x3": 94.7,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.1,
"r_y0": 540.0,
"r_x1": 172.6,
"r_y1": 540.0,
"r_x2": 172.6,
"r_y2": 531.1,
"r_x3": 138.1,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.6,
"r_x3": 175.9,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.0,
"r_y0": 540.2,
"r_x1": 281.6,
"r_y1": 540.2,
"r_x2": 281.6,
"r_y2": 531.3,
"r_x3": 195.0,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 566.7,
"r_x1": 57.9,
"r_y1": 566.7,
"r_x2": 57.9,
"r_y2": 555.9,
"r_x3": 50.1,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 566.7,
"r_x1": 172.0,
"r_y1": 566.7,
"r_x2": 172.0,
"r_y2": 555.9,
"r_x3": 68.4,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.1,
"r_x1": 64.7,
"r_y1": 586.1,
"r_x2": 64.7,
"r_y2": 576.3,
"r_x3": 50.1,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.4,
"r_y0": 586.1,
"r_x1": 179.2,
"r_y1": 586.1,
"r_x2": 179.2,
"r_y2": 576.3,
"r_x3": 74.4,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 604.6,
"r_x1": 203.0,
"r_y1": 604.6,
"r_x2": 203.0,
"r_y2": 595.7,
"r_x3": 62.1,
"r_y3": 595.7,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.4,
"r_y0": 604.4,
"r_x1": 286.4,
"r_y1": 604.4,
"r_x2": 286.4,
"r_y2": 595.8,
"r_x3": 205.4,
"r_y3": 595.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 616.4,
"r_x1": 70.0,
"r_y1": 616.4,
"r_x2": 70.0,
"r_y2": 607.8,
"r_x3": 50.1,
"r_y3": 607.8,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 616.6,
"r_x1": 286.4,
"r_y1": 616.6,
"r_x2": 286.4,
"r_y2": 607.7,
"r_x3": 70.0,
"r_y3": 607.7,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 628.6,
"r_x1": 286.4,
"r_y1": 628.6,
"r_x2": 286.4,
"r_y2": 619.6,
"r_x3": 50.1,
"r_y3": 619.6,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 640.5,
"r_x1": 207.0,
"r_y1": 640.5,
"r_x2": 207.0,
"r_y2": 631.6,
"r_x3": 50.1,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.7,
"r_y0": 663.5,
"r_x1": 186.0,
"r_y1": 663.5,
"r_x2": 186.0,
"r_y2": 654.5,
"r_x3": 91.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.5,
"r_y0": 663.2,
"r_x1": 196.3,
"r_y1": 663.2,
"r_x2": 196.3,
"r_y2": 653.8,
"r_x3": 188.5,
"r_y3": 653.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.7,
"r_y0": 663.5,
"r_x1": 244.8,
"r_y1": 663.5,
"r_x2": 244.8,
"r_y2": 654.5,
"r_x3": 198.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.0,
"r_y0": 678.4,
"r_x1": 186.2,
"r_y1": 678.4,
"r_x2": 186.2,
"r_y2": 669.5,
"r_x3": 101.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.7,
"r_y0": 678.2,
"r_x1": 196.5,
"r_y1": 678.2,
"r_x2": 196.5,
"r_y2": 668.8,
"r_x3": 188.7,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.0,
"r_y0": 678.4,
"r_x1": 244.8,
"r_y1": 678.4,
"r_x2": 244.8,
"r_y2": 669.5,
"r_x3": 199.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 671.0,
"r_x1": 286.4,
"r_y1": 671.0,
"r_x2": 286.4,
"r_y2": 662.1,
"r_x3": 274.7,
"r_y3": 662.1,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 340.0,
"r_y1": 96.1,
"r_x2": 340.0,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 346.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 493.0,
"r_y1": 108.0,
"r_x2": 493.0,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 125.1,
"r_x1": 545.1,
"r_y1": 125.1,
"r_x2": 545.1,
"r_y2": 116.2,
"r_x3": 320.8,
"r_y3": 116.2,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 137.1,
"r_x1": 545.1,
"r_y1": 137.1,
"r_x2": 545.1,
"r_y2": 128.2,
"r_x3": 308.9,
"r_y3": 128.2,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 149.0,
"r_x1": 545.1,
"r_y1": 149.0,
"r_x2": 545.1,
"r_y2": 140.1,
"r_x3": 308.9,
"r_y3": 140.1,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 161.0,
"r_x1": 545.1,
"r_y1": 161.0,
"r_x2": 545.1,
"r_y2": 152.1,
"r_x3": 308.9,
"r_y3": 152.1,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 173.0,
"r_x1": 545.1,
"r_y1": 173.0,
"r_x2": 545.1,
"r_y2": 164.0,
"r_x3": 308.9,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 184.9,
"r_x1": 467.2,
"r_y1": 184.9,
"r_x2": 467.2,
"r_y2": 176.0,
"r_x3": 308.9,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.4,
"r_y0": 184.9,
"r_x1": 545.1,
"r_y1": 184.9,
"r_x2": 545.1,
"r_y2": 176.0,
"r_x3": 475.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 196.9,
"r_x1": 545.1,
"r_y1": 196.9,
"r_x2": 545.1,
"r_y2": 188.0,
"r_x3": 308.9,
"r_y3": 188.0,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 208.8,
"r_x1": 545.1,
"r_y1": 208.8,
"r_x2": 545.1,
"r_y2": 199.9,
"r_x3": 308.9,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 220.8,
"r_x1": 545.1,
"r_y1": 220.8,
"r_x2": 545.1,
"r_y2": 211.9,
"r_x3": 308.9,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.7,
"r_x1": 545.1,
"r_y1": 232.7,
"r_x2": 545.1,
"r_y2": 223.8,
"r_x3": 308.9,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 244.7,
"r_x1": 545.1,
"r_y1": 244.7,
"r_x2": 545.1,
"r_y2": 235.8,
"r_x3": 308.9,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.6,
"r_x1": 545.1,
"r_y1": 256.6,
"r_x2": 545.1,
"r_y2": 247.7,
"r_x3": 308.9,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.6,
"r_x1": 342.3,
"r_y1": 268.6,
"r_x2": 342.3,
"r_y2": 259.7,
"r_x3": 308.9,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.0,
"r_y0": 268.6,
"r_x1": 545.1,
"r_y1": 268.6,
"r_x2": 545.1,
"r_y2": 259.7,
"r_x3": 349.0,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.6,
"r_x1": 545.1,
"r_y1": 280.6,
"r_x2": 545.1,
"r_y2": 271.6,
"r_x3": 308.9,
"r_y3": 271.6,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.5,
"r_x1": 545.1,
"r_y1": 292.5,
"r_x2": 545.1,
"r_y2": 283.6,
"r_x3": 308.9,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 295.6,
"r_x3": 308.9,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.4,
"r_x1": 545.1,
"r_y1": 316.4,
"r_x2": 545.1,
"r_y2": 307.5,
"r_x3": 308.9,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.4,
"r_x1": 532.5,
"r_y1": 328.4,
"r_x2": 532.5,
"r_y2": 319.5,
"r_x3": 308.9,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 345.5,
"r_x1": 545.1,
"r_y1": 345.5,
"r_x2": 545.1,
"r_y2": 336.6,
"r_x3": 320.8,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 357.4,
"r_x1": 403.7,
"r_y1": 357.4,
"r_x2": 403.7,
"r_y2": 348.5,
"r_x3": 308.9,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.1,
"r_y0": 357.2,
"r_x1": 503.5,
"r_y1": 357.2,
"r_x2": 503.5,
"r_y2": 348.6,
"r_x3": 406.1,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.5,
"r_y0": 357.4,
"r_x1": 506.0,
"r_y1": 357.4,
"r_x2": 506.0,
"r_y2": 348.5,
"r_x3": 503.5,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.2,
"r_x1": 545.1,
"r_y1": 357.2,
"r_x2": 545.1,
"r_y2": 348.6,
"r_x3": 508.4,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 369.2,
"r_x1": 343.2,
"r_y1": 369.2,
"r_x2": 343.2,
"r_y2": 360.6,
"r_x3": 308.9,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.2,
"r_y0": 369.4,
"r_x1": 362.2,
"r_y1": 369.4,
"r_x2": 362.2,
"r_y2": 360.5,
"r_x3": 343.2,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.3,
"r_y0": 369.2,
"r_x1": 440.9,
"r_y1": 369.2,
"r_x2": 440.9,
"r_y2": 360.6,
"r_x3": 364.3,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.9,
"r_y0": 369.4,
"r_x1": 545.1,
"r_y1": 369.4,
"r_x2": 545.1,
"r_y2": 360.5,
"r_x3": 440.9,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 381.3,
"r_x1": 545.1,
"r_y1": 381.3,
"r_x2": 545.1,
"r_y2": 372.4,
"r_x3": 308.9,
"r_y3": 372.4,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 393.3,
"r_x1": 545.1,
"r_y1": 393.3,
"r_x2": 545.1,
"r_y2": 384.4,
"r_x3": 308.9,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 405.0,
"r_x1": 314.7,
"r_y1": 405.0,
"r_x2": 314.7,
"r_y2": 396.2,
"r_x3": 308.9,
"r_y3": 396.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.7,
"r_y0": 405.3,
"r_x1": 360.4,
"r_y1": 405.3,
"r_x2": 360.4,
"r_y2": 396.4,
"r_x3": 318.7,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.0,
"r_y0": 405.3,
"r_x1": 545.1,
"r_y1": 405.3,
"r_x2": 545.1,
"r_y2": 396.4,
"r_x3": 368.0,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 417.2,
"r_x1": 545.1,
"r_y1": 417.2,
"r_x2": 545.1,
"r_y2": 408.3,
"r_x3": 308.9,
"r_y3": 408.3,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 429.2,
"r_x1": 361.0,
"r_y1": 429.2,
"r_x2": 361.0,
"r_y2": 420.3,
"r_x3": 308.9,
"r_y3": 420.3,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 446.3,
"r_x1": 545.1,
"r_y1": 446.3,
"r_x2": 545.1,
"r_y2": 437.4,
"r_x3": 320.8,
"r_y3": 437.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 458.2,
"r_x1": 384.6,
"r_y1": 458.2,
"r_x2": 384.6,
"r_y2": 449.3,
"r_x3": 308.9,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 458.2,
"r_x1": 545.1,
"r_y1": 458.2,
"r_x2": 545.1,
"r_y2": 449.3,
"r_x3": 391.4,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 470.2,
"r_x1": 494.0,
"r_y1": 470.2,
"r_x2": 494.0,
"r_y2": 461.3,
"r_x3": 308.9,
"r_y3": 461.3,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.1,
"r_y0": 470.0,
"r_x1": 545.1,
"r_y1": 470.0,
"r_x2": 545.1,
"r_y2": 461.4,
"r_x3": 498.1,
"r_y3": 461.4,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 481.9,
"r_x1": 364.4,
"r_y1": 481.9,
"r_x2": 364.4,
"r_y2": 473.3,
"r_x3": 308.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.1,
"r_y0": 482.1,
"r_x1": 545.1,
"r_y1": 482.1,
"r_x2": 545.1,
"r_y2": 473.2,
"r_x3": 367.1,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 494.1,
"r_x1": 545.1,
"r_y1": 494.1,
"r_x2": 545.1,
"r_y2": 485.2,
"r_x3": 308.9,
"r_y3": 485.2,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 506.1,
"r_x1": 545.1,
"r_y1": 506.1,
"r_x2": 545.1,
"r_y2": 497.1,
"r_x3": 308.9,
"r_y3": 497.1,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 518.0,
"r_x1": 545.1,
"r_y1": 518.0,
"r_x2": 545.1,
"r_y2": 509.1,
"r_x3": 308.9,
"r_y3": 509.1,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 530.0,
"r_x1": 545.1,
"r_y1": 530.0,
"r_x2": 545.1,
"r_y2": 521.1,
"r_x3": 308.9,
"r_y3": 521.1,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 541.9,
"r_x1": 545.1,
"r_y1": 541.9,
"r_x2": 545.1,
"r_y2": 533.0,
"r_x3": 308.9,
"r_y3": 533.0,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 553.9,
"r_x1": 377.2,
"r_y1": 553.9,
"r_x2": 377.2,
"r_y2": 545.0,
"r_x3": 308.9,
"r_y3": 545.0,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 589.4,
"r_x1": 323.9,
"r_y1": 589.4,
"r_x2": 323.9,
"r_y2": 579.6,
"r_x3": 308.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.9,
"r_y0": 589.4,
"r_x1": 397.4,
"r_y1": 589.4,
"r_x2": 397.4,
"r_y2": 579.6,
"r_x3": 333.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 612.4,
"r_x1": 545.1,
"r_y1": 612.4,
"r_x2": 545.1,
"r_y2": 603.4,
"r_x3": 320.8,
"r_y3": 603.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 624.3,
"r_x1": 545.1,
"r_y1": 624.3,
"r_x2": 545.1,
"r_y2": 615.4,
"r_x3": 308.9,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 636.3,
"r_x1": 545.1,
"r_y1": 636.3,
"r_x2": 545.1,
"r_y2": 627.4,
"r_x3": 308.9,
"r_y3": 627.4,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 648.2,
"r_x1": 545.1,
"r_y1": 648.2,
"r_x2": 545.1,
"r_y2": 639.3,
"r_x3": 308.9,
"r_y3": 639.3,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 660.2,
"r_x1": 545.1,
"r_y1": 660.2,
"r_x2": 545.1,
"r_y2": 651.3,
"r_x3": 308.9,
"r_y3": 651.3,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 672.1,
"r_x1": 350.7,
"r_y1": 672.1,
"r_x2": 350.7,
"r_y2": 663.2,
"r_x3": 308.9,
"r_y3": 663.2,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 320.8,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 396.2,
"r_y1": 701.2,
"r_x2": 396.2,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.4,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 406.4,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 495.9,
"r_y1": 713.2,
"r_x2": 495.9,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 155.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 286.4,
"r_y1": 108.0,
"r_x2": 286.4,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.9,
"r_x1": 286.4,
"r_y1": 131.9,
"r_x2": 286.4,
"r_y2": 123.0,
"r_x3": 50.1,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.8,
"r_x1": 175.2,
"r_y1": 155.8,
"r_x2": 175.2,
"r_y2": 146.9,
"r_x3": 50.1,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 159.6,
"r": 286.4,
"b": 240.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 168.5,
"r_x1": 286.4,
"r_y1": 168.5,
"r_x2": 286.4,
"r_y2": 159.6,
"r_x3": 62.1,
"r_y3": 159.6,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.5,
"r_x1": 286.4,
"r_y1": 180.5,
"r_x2": 286.4,
"r_y2": 171.6,
"r_x3": 50.1,
"r_y3": 171.6,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.4,
"r_x1": 286.4,
"r_y1": 192.4,
"r_x2": 286.4,
"r_y2": 183.5,
"r_x3": 50.1,
"r_y3": 183.5,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.4,
"r_x1": 286.4,
"r_y1": 204.4,
"r_x2": 286.4,
"r_y2": 195.5,
"r_x3": 50.1,
"r_y3": 195.5,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.4,
"r_x1": 286.4,
"r_y1": 216.4,
"r_x2": 286.4,
"r_y2": 207.4,
"r_x3": 50.1,
"r_y3": 207.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.3,
"r_x1": 286.4,
"r_y1": 228.3,
"r_x2": 286.4,
"r_y2": 219.4,
"r_x3": 50.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 240.3,
"r_x1": 181.5,
"r_y1": 240.3,
"r_x2": 181.5,
"r_y2": 231.4,
"r_x3": 50.1,
"r_y3": 231.4,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.9,
"r": 286.4,
"b": 444.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.9,
"r_x1": 129.2,
"r_y1": 252.9,
"r_x2": 129.2,
"r_y2": 243.9,
"r_x3": 62.1,
"r_y3": 243.9,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.5,
"r_y0": 252.9,
"r_x1": 286.4,
"r_y1": 252.9,
"r_x2": 286.4,
"r_y2": 244.0,
"r_x3": 134.5,
"r_y3": 244.0,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.9,
"r_x1": 286.4,
"r_y1": 264.9,
"r_x2": 286.4,
"r_y2": 256.0,
"r_x3": 50.1,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 56.8,
"r_y1": 276.6,
"r_x2": 56.8,
"r_y2": 267.8,
"r_x3": 50.1,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.3,
"r_y0": 276.9,
"r_x1": 135.4,
"r_y1": 276.9,
"r_x2": 135.4,
"r_y2": 268.0,
"r_x3": 57.3,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.7,
"r_y0": 276.6,
"r_x1": 211.1,
"r_y1": 276.6,
"r_x2": 211.1,
"r_y2": 268.0,
"r_x3": 137.7,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.6,
"r_y0": 276.9,
"r_x1": 286.4,
"r_y1": 276.9,
"r_x2": 286.4,
"r_y2": 268.0,
"r_x3": 213.6,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.8,
"r_x1": 158.8,
"r_y1": 288.8,
"r_x2": 158.8,
"r_y2": 279.9,
"r_x3": 50.1,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.3,
"r_y0": 288.6,
"r_x1": 238.8,
"r_y1": 288.6,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.3,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.5,
"r_y0": 288.8,
"r_x1": 286.4,
"r_y1": 288.8,
"r_x2": 286.4,
"r_y2": 279.9,
"r_x3": 241.5,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.8,
"r_x1": 211.4,
"r_y1": 300.8,
"r_x2": 211.4,
"r_y2": 291.9,
"r_x3": 50.1,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.3,
"r_y0": 300.5,
"r_x1": 229.2,
"r_y1": 300.5,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.3,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.8,
"r_x1": 232.2,
"r_y1": 300.8,
"r_x2": 232.2,
"r_y2": 291.9,
"r_x3": 229.7,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.5,
"r_y0": 300.5,
"r_x1": 251.4,
"r_y1": 300.5,
"r_x2": 251.4,
"r_y2": 291.7,
"r_x3": 236.5,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.8,
"r_y0": 300.8,
"r_x1": 286.4,
"r_y1": 300.8,
"r_x2": 286.4,
"r_y2": 291.9,
"r_x3": 254.8,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.7,
"r_x1": 137.5,
"r_y1": 312.7,
"r_x2": 137.5,
"r_y2": 303.8,
"r_x3": 50.1,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.2,
"r_y1": 312.5,
"r_x2": 148.2,
"r_y2": 303.7,
"r_x3": 141.3,
"r_y3": 303.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.6,
"r_y0": 312.7,
"r_x1": 286.4,
"r_y1": 312.7,
"r_x2": 286.4,
"r_y2": 303.8,
"r_x3": 152.6,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.7,
"r_x1": 89.7,
"r_y1": 324.7,
"r_x2": 89.7,
"r_y2": 315.8,
"r_x3": 50.1,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.7,
"r_y0": 324.5,
"r_x1": 104.1,
"r_y1": 324.5,
"r_x2": 104.1,
"r_y2": 315.6,
"r_x3": 89.7,
"r_y3": 315.6,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.6,
"r_y0": 324.7,
"r_x1": 286.4,
"r_y1": 324.7,
"r_x2": 286.4,
"r_y2": 315.8,
"r_x3": 104.6,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.6,
"r_x1": 286.4,
"r_y1": 336.6,
"r_x2": 286.4,
"r_y2": 327.7,
"r_x3": 50.1,
"r_y3": 327.7,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.6,
"r_x1": 286.4,
"r_y1": 348.6,
"r_x2": 286.4,
"r_y2": 339.7,
"r_x3": 50.1,
"r_y3": 339.7,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.5,
"r_x1": 286.4,
"r_y1": 360.5,
"r_x2": 286.4,
"r_y2": 351.6,
"r_x3": 50.1,
"r_y3": 351.6,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.5,
"r_x1": 286.4,
"r_y1": 372.5,
"r_x2": 286.4,
"r_y2": 363.6,
"r_x3": 50.1,
"r_y3": 363.6,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.5,
"r_x1": 286.4,
"r_y1": 384.5,
"r_x2": 286.4,
"r_y2": 375.5,
"r_x3": 50.1,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.4,
"r_x1": 286.4,
"r_y1": 396.4,
"r_x2": 286.4,
"r_y2": 387.5,
"r_x3": 50.1,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.4,
"r_x1": 88.7,
"r_y1": 408.4,
"r_x2": 88.7,
"r_y2": 399.5,
"r_x3": 50.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.6,
"r_y0": 408.1,
"r_x1": 170.1,
"r_y1": 408.1,
"r_x2": 170.1,
"r_y2": 399.5,
"r_x3": 91.6,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.1,
"r_y0": 408.4,
"r_x1": 286.4,
"r_y1": 408.4,
"r_x2": 286.4,
"r_y2": 399.5,
"r_x3": 170.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.3,
"r_x1": 182.0,
"r_y1": 420.3,
"r_x2": 182.0,
"r_y2": 411.4,
"r_x3": 50.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.1,
"r_y0": 420.3,
"r_x1": 197.7,
"r_y1": 420.3,
"r_x2": 197.7,
"r_y2": 411.4,
"r_x3": 189.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 420.3,
"r_x1": 286.4,
"r_y1": 420.3,
"r_x2": 286.4,
"r_y2": 411.4,
"r_x3": 200.3,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.3,
"r_x1": 286.4,
"r_y1": 432.3,
"r_x2": 286.4,
"r_y2": 423.4,
"r_x3": 50.1,
"r_y3": 423.4,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 158.3,
"r_y1": 444.2,
"r_x2": 158.3,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 448.0,
"r": 286.4,
"b": 468.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 456.9,
"r_x1": 286.4,
"r_y1": 456.9,
"r_x2": 286.4,
"r_y2": 448.0,
"r_x3": 62.1,
"r_y3": 448.0,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 468.9,
"r_x1": 91.4,
"r_y1": 468.9,
"r_x2": 91.4,
"r_y2": 460.0,
"r_x3": 50.1,
"r_y3": 460.0,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "formula",
"bbox": {
"l": 124.3,
"t": 493.3,
"r": 286.4,
"b": 517.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.7,
"r_y0": 502.1,
"r_x1": 140.6,
"r_y1": 502.1,
"r_x2": 140.6,
"r_y2": 493.3,
"r_x3": 125.7,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.9,
"r_y0": 502.1,
"r_x1": 151.7,
"r_y1": 502.1,
"r_x2": 151.7,
"r_y2": 493.3,
"r_x3": 143.9,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.4,
"r_y0": 502.1,
"r_x1": 186.6,
"r_y1": 502.1,
"r_x2": 186.6,
"r_y2": 493.3,
"r_x3": 154.4,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.3,
"r_y0": 502.1,
"r_x1": 197.1,
"r_y1": 502.1,
"r_x2": 197.1,
"r_y2": 493.3,
"r_x3": 189.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.1,
"r_x1": 211.6,
"r_y1": 502.1,
"r_x2": 211.6,
"r_y2": 493.3,
"r_x3": 199.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.3,
"r_y0": 517.1,
"r_x1": 127.3,
"r_y1": 517.1,
"r_x2": 127.3,
"r_y2": 508.2,
"r_x3": 124.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.3,
"r_y0": 517.1,
"r_x1": 138.0,
"r_y1": 517.1,
"r_x2": 138.0,
"r_y2": 508.2,
"r_x3": 130.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.8,
"r_y0": 517.1,
"r_x1": 153.3,
"r_y1": 517.1,
"r_x2": 153.3,
"r_y2": 508.2,
"r_x3": 140.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 517.1,
"r_x1": 174.9,
"r_y1": 517.1,
"r_x2": 174.9,
"r_y2": 508.2,
"r_x3": 156.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.1,
"r_y0": 517.1,
"r_x1": 184.8,
"r_y1": 517.1,
"r_x2": 184.8,
"r_y2": 507.7,
"r_x3": 177.1,
"r_y3": 507.7,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 517.1,
"r_x1": 192.8,
"r_y1": 517.1,
"r_x2": 192.8,
"r_y2": 508.2,
"r_x3": 187.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.8,
"r_y0": 517.1,
"r_x1": 196.7,
"r_y1": 517.1,
"r_x2": 196.7,
"r_y2": 508.2,
"r_x3": 192.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.7,
"r_y0": 517.1,
"r_x1": 211.6,
"r_y1": 517.1,
"r_x2": 211.6,
"r_y2": 508.2,
"r_x3": 196.7,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 509.9,
"r_x1": 286.4,
"r_y1": 509.9,
"r_x2": 286.4,
"r_y2": 501.0,
"r_x3": 274.7,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 530.6,
"r": 281.6,
"b": 540.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 540.2,
"r_x1": 74.5,
"r_y1": 540.2,
"r_x2": 74.5,
"r_y2": 531.3,
"r_x3": 50.1,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 540.0,
"r_x1": 82.8,
"r_y1": 540.0,
"r_x2": 82.8,
"r_y2": 531.1,
"r_x3": 76.9,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.5,
"r_y0": 540.0,
"r_x1": 92.2,
"r_y1": 540.0,
"r_x2": 92.2,
"r_y2": 530.6,
"r_x3": 85.5,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.7,
"r_y0": 540.2,
"r_x1": 135.6,
"r_y1": 540.2,
"r_x2": 135.6,
"r_y2": 531.3,
"r_x3": 94.7,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.1,
"r_y0": 540.0,
"r_x1": 172.6,
"r_y1": 540.0,
"r_x2": 172.6,
"r_y2": 531.1,
"r_x3": 138.1,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.6,
"r_x3": 175.9,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.0,
"r_y0": 540.2,
"r_x1": 281.6,
"r_y1": 540.2,
"r_x2": 281.6,
"r_y2": 531.3,
"r_x3": 195.0,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 555.9,
"r": 172.0,
"b": 566.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 566.7,
"r_x1": 57.9,
"r_y1": 566.7,
"r_x2": 57.9,
"r_y2": 555.9,
"r_x3": 50.1,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 566.7,
"r_x1": 172.0,
"r_y1": 566.7,
"r_x2": 172.0,
"r_y2": 555.9,
"r_x3": 68.4,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 576.3,
"r": 179.2,
"b": 586.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.1,
"r_x1": 64.7,
"r_y1": 586.1,
"r_x2": 64.7,
"r_y2": 576.3,
"r_x3": 50.1,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.4,
"r_y0": 586.1,
"r_x1": 179.2,
"r_y1": 586.1,
"r_x2": 179.2,
"r_y2": 576.3,
"r_x3": 74.4,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 595.7,
"r": 286.4,
"b": 640.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 604.6,
"r_x1": 203.0,
"r_y1": 604.6,
"r_x2": 203.0,
"r_y2": 595.7,
"r_x3": 62.1,
"r_y3": 595.7,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.4,
"r_y0": 604.4,
"r_x1": 286.4,
"r_y1": 604.4,
"r_x2": 286.4,
"r_y2": 595.8,
"r_x3": 205.4,
"r_y3": 595.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 616.4,
"r_x1": 70.0,
"r_y1": 616.4,
"r_x2": 70.0,
"r_y2": 607.8,
"r_x3": 50.1,
"r_y3": 607.8,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 616.6,
"r_x1": 286.4,
"r_y1": 616.6,
"r_x2": 286.4,
"r_y2": 607.7,
"r_x3": 70.0,
"r_y3": 607.7,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 628.6,
"r_x1": 286.4,
"r_y1": 628.6,
"r_x2": 286.4,
"r_y2": 619.6,
"r_x3": 50.1,
"r_y3": 619.6,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 640.5,
"r_x1": 207.0,
"r_y1": 640.5,
"r_x2": 207.0,
"r_y2": 631.6,
"r_x3": 50.1,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "formula",
"bbox": {
"l": 91.7,
"t": 653.8,
"r": 286.4,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.7,
"r_y0": 663.5,
"r_x1": 186.0,
"r_y1": 663.5,
"r_x2": 186.0,
"r_y2": 654.5,
"r_x3": 91.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.5,
"r_y0": 663.2,
"r_x1": 196.3,
"r_y1": 663.2,
"r_x2": 196.3,
"r_y2": 653.8,
"r_x3": 188.5,
"r_y3": 653.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.7,
"r_y0": 663.5,
"r_x1": 244.8,
"r_y1": 663.5,
"r_x2": 244.8,
"r_y2": 654.5,
"r_x3": 198.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.0,
"r_y0": 678.4,
"r_x1": 186.2,
"r_y1": 678.4,
"r_x2": 186.2,
"r_y2": 669.5,
"r_x3": 101.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.7,
"r_y0": 678.2,
"r_x1": 196.5,
"r_y1": 678.2,
"r_x2": 196.5,
"r_y2": 668.8,
"r_x3": 188.7,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.0,
"r_y0": 678.4,
"r_x1": 244.8,
"r_y1": 678.4,
"r_x2": 244.8,
"r_y2": 669.5,
"r_x3": 199.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 671.0,
"r_x1": 286.4,
"r_y1": 671.0,
"r_x2": 286.4,
"r_y2": 662.1,
"r_x3": 274.7,
"r_y3": 662.1,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 340.0,
"r_y1": 96.1,
"r_x2": 340.0,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 346.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 493.0,
"r_y1": 108.0,
"r_x2": 493.0,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 116.2,
"r": 545.1,
"b": 328.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 125.1,
"r_x1": 545.1,
"r_y1": 125.1,
"r_x2": 545.1,
"r_y2": 116.2,
"r_x3": 320.8,
"r_y3": 116.2,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 137.1,
"r_x1": 545.1,
"r_y1": 137.1,
"r_x2": 545.1,
"r_y2": 128.2,
"r_x3": 308.9,
"r_y3": 128.2,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 149.0,
"r_x1": 545.1,
"r_y1": 149.0,
"r_x2": 545.1,
"r_y2": 140.1,
"r_x3": 308.9,
"r_y3": 140.1,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 161.0,
"r_x1": 545.1,
"r_y1": 161.0,
"r_x2": 545.1,
"r_y2": 152.1,
"r_x3": 308.9,
"r_y3": 152.1,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 173.0,
"r_x1": 545.1,
"r_y1": 173.0,
"r_x2": 545.1,
"r_y2": 164.0,
"r_x3": 308.9,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 184.9,
"r_x1": 467.2,
"r_y1": 184.9,
"r_x2": 467.2,
"r_y2": 176.0,
"r_x3": 308.9,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.4,
"r_y0": 184.9,
"r_x1": 545.1,
"r_y1": 184.9,
"r_x2": 545.1,
"r_y2": 176.0,
"r_x3": 475.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 196.9,
"r_x1": 545.1,
"r_y1": 196.9,
"r_x2": 545.1,
"r_y2": 188.0,
"r_x3": 308.9,
"r_y3": 188.0,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 208.8,
"r_x1": 545.1,
"r_y1": 208.8,
"r_x2": 545.1,
"r_y2": 199.9,
"r_x3": 308.9,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 220.8,
"r_x1": 545.1,
"r_y1": 220.8,
"r_x2": 545.1,
"r_y2": 211.9,
"r_x3": 308.9,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.7,
"r_x1": 545.1,
"r_y1": 232.7,
"r_x2": 545.1,
"r_y2": 223.8,
"r_x3": 308.9,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 244.7,
"r_x1": 545.1,
"r_y1": 244.7,
"r_x2": 545.1,
"r_y2": 235.8,
"r_x3": 308.9,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.6,
"r_x1": 545.1,
"r_y1": 256.6,
"r_x2": 545.1,
"r_y2": 247.7,
"r_x3": 308.9,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.6,
"r_x1": 342.3,
"r_y1": 268.6,
"r_x2": 342.3,
"r_y2": 259.7,
"r_x3": 308.9,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.0,
"r_y0": 268.6,
"r_x1": 545.1,
"r_y1": 268.6,
"r_x2": 545.1,
"r_y2": 259.7,
"r_x3": 349.0,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.6,
"r_x1": 545.1,
"r_y1": 280.6,
"r_x2": 545.1,
"r_y2": 271.6,
"r_x3": 308.9,
"r_y3": 271.6,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.5,
"r_x1": 545.1,
"r_y1": 292.5,
"r_x2": 545.1,
"r_y2": 283.6,
"r_x3": 308.9,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 295.6,
"r_x3": 308.9,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.4,
"r_x1": 545.1,
"r_y1": 316.4,
"r_x2": 545.1,
"r_y2": 307.5,
"r_x3": 308.9,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.4,
"r_x1": 532.5,
"r_y1": 328.4,
"r_x2": 532.5,
"r_y2": 319.5,
"r_x3": 308.9,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 336.6,
"r": 545.1,
"b": 429.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 345.5,
"r_x1": 545.1,
"r_y1": 345.5,
"r_x2": 545.1,
"r_y2": 336.6,
"r_x3": 320.8,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 357.4,
"r_x1": 403.7,
"r_y1": 357.4,
"r_x2": 403.7,
"r_y2": 348.5,
"r_x3": 308.9,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.1,
"r_y0": 357.2,
"r_x1": 503.5,
"r_y1": 357.2,
"r_x2": 503.5,
"r_y2": 348.6,
"r_x3": 406.1,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.5,
"r_y0": 357.4,
"r_x1": 506.0,
"r_y1": 357.4,
"r_x2": 506.0,
"r_y2": 348.5,
"r_x3": 503.5,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.2,
"r_x1": 545.1,
"r_y1": 357.2,
"r_x2": 545.1,
"r_y2": 348.6,
"r_x3": 508.4,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 369.2,
"r_x1": 343.2,
"r_y1": 369.2,
"r_x2": 343.2,
"r_y2": 360.6,
"r_x3": 308.9,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.2,
"r_y0": 369.4,
"r_x1": 362.2,
"r_y1": 369.4,
"r_x2": 362.2,
"r_y2": 360.5,
"r_x3": 343.2,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.3,
"r_y0": 369.2,
"r_x1": 440.9,
"r_y1": 369.2,
"r_x2": 440.9,
"r_y2": 360.6,
"r_x3": 364.3,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.9,
"r_y0": 369.4,
"r_x1": 545.1,
"r_y1": 369.4,
"r_x2": 545.1,
"r_y2": 360.5,
"r_x3": 440.9,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 381.3,
"r_x1": 545.1,
"r_y1": 381.3,
"r_x2": 545.1,
"r_y2": 372.4,
"r_x3": 308.9,
"r_y3": 372.4,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 393.3,
"r_x1": 545.1,
"r_y1": 393.3,
"r_x2": 545.1,
"r_y2": 384.4,
"r_x3": 308.9,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 405.0,
"r_x1": 314.7,
"r_y1": 405.0,
"r_x2": 314.7,
"r_y2": 396.2,
"r_x3": 308.9,
"r_y3": 396.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.7,
"r_y0": 405.3,
"r_x1": 360.4,
"r_y1": 405.3,
"r_x2": 360.4,
"r_y2": 396.4,
"r_x3": 318.7,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.0,
"r_y0": 405.3,
"r_x1": 545.1,
"r_y1": 405.3,
"r_x2": 545.1,
"r_y2": 396.4,
"r_x3": 368.0,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 417.2,
"r_x1": 545.1,
"r_y1": 417.2,
"r_x2": 545.1,
"r_y2": 408.3,
"r_x3": 308.9,
"r_y3": 408.3,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 429.2,
"r_x1": 361.0,
"r_y1": 429.2,
"r_x2": 361.0,
"r_y2": 420.3,
"r_x3": 308.9,
"r_y3": 420.3,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 437.4,
"r": 545.1,
"b": 553.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 446.3,
"r_x1": 545.1,
"r_y1": 446.3,
"r_x2": 545.1,
"r_y2": 437.4,
"r_x3": 320.8,
"r_y3": 437.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 458.2,
"r_x1": 384.6,
"r_y1": 458.2,
"r_x2": 384.6,
"r_y2": 449.3,
"r_x3": 308.9,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 458.2,
"r_x1": 545.1,
"r_y1": 458.2,
"r_x2": 545.1,
"r_y2": 449.3,
"r_x3": 391.4,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 470.2,
"r_x1": 494.0,
"r_y1": 470.2,
"r_x2": 494.0,
"r_y2": 461.3,
"r_x3": 308.9,
"r_y3": 461.3,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.1,
"r_y0": 470.0,
"r_x1": 545.1,
"r_y1": 470.0,
"r_x2": 545.1,
"r_y2": 461.4,
"r_x3": 498.1,
"r_y3": 461.4,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 481.9,
"r_x1": 364.4,
"r_y1": 481.9,
"r_x2": 364.4,
"r_y2": 473.3,
"r_x3": 308.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.1,
"r_y0": 482.1,
"r_x1": 545.1,
"r_y1": 482.1,
"r_x2": 545.1,
"r_y2": 473.2,
"r_x3": 367.1,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 494.1,
"r_x1": 545.1,
"r_y1": 494.1,
"r_x2": 545.1,
"r_y2": 485.2,
"r_x3": 308.9,
"r_y3": 485.2,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 506.1,
"r_x1": 545.1,
"r_y1": 506.1,
"r_x2": 545.1,
"r_y2": 497.1,
"r_x3": 308.9,
"r_y3": 497.1,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 518.0,
"r_x1": 545.1,
"r_y1": 518.0,
"r_x2": 545.1,
"r_y2": 509.1,
"r_x3": 308.9,
"r_y3": 509.1,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 530.0,
"r_x1": 545.1,
"r_y1": 530.0,
"r_x2": 545.1,
"r_y2": 521.1,
"r_x3": 308.9,
"r_y3": 521.1,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 541.9,
"r_x1": 545.1,
"r_y1": 541.9,
"r_x2": 545.1,
"r_y2": 533.0,
"r_x3": 308.9,
"r_y3": 533.0,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 553.9,
"r_x1": 377.2,
"r_y1": 553.9,
"r_x2": 377.2,
"r_y2": 545.0,
"r_x3": 308.9,
"r_y3": 545.0,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 579.6,
"r": 397.4,
"b": 589.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 589.4,
"r_x1": 323.9,
"r_y1": 589.4,
"r_x2": 323.9,
"r_y2": 579.6,
"r_x3": 308.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.9,
"r_y0": 589.4,
"r_x1": 397.4,
"r_y1": 589.4,
"r_x2": 397.4,
"r_y2": 579.6,
"r_x3": 333.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 603.4,
"r": 545.1,
"b": 672.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 612.4,
"r_x1": 545.1,
"r_y1": 612.4,
"r_x2": 545.1,
"r_y2": 603.4,
"r_x3": 320.8,
"r_y3": 603.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 624.3,
"r_x1": 545.1,
"r_y1": 624.3,
"r_x2": 545.1,
"r_y2": 615.4,
"r_x3": 308.9,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 636.3,
"r_x1": 545.1,
"r_y1": 636.3,
"r_x2": 545.1,
"r_y2": 627.4,
"r_x3": 308.9,
"r_y3": 627.4,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 648.2,
"r_x1": 545.1,
"r_y1": 648.2,
"r_x2": 545.1,
"r_y2": 639.3,
"r_x3": 308.9,
"r_y3": 639.3,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 660.2,
"r_x1": 545.1,
"r_y1": 660.2,
"r_x2": 545.1,
"r_y2": 651.3,
"r_x3": 308.9,
"r_y3": 651.3,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 672.1,
"r_x1": 350.7,
"r_y1": 672.1,
"r_x2": 350.7,
"r_y2": 663.2,
"r_x3": 308.9,
"r_y3": 663.2,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 680.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 320.8,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 396.2,
"r_y1": 701.2,
"r_x2": 396.2,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.4,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 406.4,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 495.9,
"r_y1": 713.2,
"r_x2": 495.9,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 5,
"page_no": 5,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 155.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 286.4,
"r_y1": 108.0,
"r_x2": 286.4,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.9,
"r_x1": 286.4,
"r_y1": 131.9,
"r_x2": 286.4,
"r_y2": 123.0,
"r_x3": 50.1,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.8,
"r_x1": 175.2,
"r_y1": 155.8,
"r_x2": 175.2,
"r_y2": 146.9,
"r_x3": 50.1,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."
},
{
"label": "text",
"id": 6,
"page_no": 5,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 159.6,
"r": 286.4,
"b": 240.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 168.5,
"r_x1": 286.4,
"r_y1": 168.5,
"r_x2": 286.4,
"r_y2": 159.6,
"r_x3": 62.1,
"r_y3": 159.6,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.5,
"r_x1": 286.4,
"r_y1": 180.5,
"r_x2": 286.4,
"r_y2": 171.6,
"r_x3": 50.1,
"r_y3": 171.6,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.4,
"r_x1": 286.4,
"r_y1": 192.4,
"r_x2": 286.4,
"r_y2": 183.5,
"r_x3": 50.1,
"r_y3": 183.5,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.4,
"r_x1": 286.4,
"r_y1": 204.4,
"r_x2": 286.4,
"r_y2": 195.5,
"r_x3": 50.1,
"r_y3": 195.5,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.4,
"r_x1": 286.4,
"r_y1": 216.4,
"r_x2": 286.4,
"r_y2": 207.4,
"r_x3": 50.1,
"r_y3": 207.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.3,
"r_x1": 286.4,
"r_y1": 228.3,
"r_x2": 286.4,
"r_y2": 219.4,
"r_x3": 50.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 240.3,
"r_x1": 181.5,
"r_y1": 240.3,
"r_x2": 181.5,
"r_y2": 231.4,
"r_x3": 50.1,
"r_y3": 231.4,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."
},
{
"label": "text",
"id": 4,
"page_no": 5,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.9,
"r": 286.4,
"b": 444.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.9,
"r_x1": 129.2,
"r_y1": 252.9,
"r_x2": 129.2,
"r_y2": 243.9,
"r_x3": 62.1,
"r_y3": 243.9,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.5,
"r_y0": 252.9,
"r_x1": 286.4,
"r_y1": 252.9,
"r_x2": 286.4,
"r_y2": 244.0,
"r_x3": 134.5,
"r_y3": 244.0,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.9,
"r_x1": 286.4,
"r_y1": 264.9,
"r_x2": 286.4,
"r_y2": 256.0,
"r_x3": 50.1,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 56.8,
"r_y1": 276.6,
"r_x2": 56.8,
"r_y2": 267.8,
"r_x3": 50.1,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.3,
"r_y0": 276.9,
"r_x1": 135.4,
"r_y1": 276.9,
"r_x2": 135.4,
"r_y2": 268.0,
"r_x3": 57.3,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.7,
"r_y0": 276.6,
"r_x1": 211.1,
"r_y1": 276.6,
"r_x2": 211.1,
"r_y2": 268.0,
"r_x3": 137.7,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.6,
"r_y0": 276.9,
"r_x1": 286.4,
"r_y1": 276.9,
"r_x2": 286.4,
"r_y2": 268.0,
"r_x3": 213.6,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.8,
"r_x1": 158.8,
"r_y1": 288.8,
"r_x2": 158.8,
"r_y2": 279.9,
"r_x3": 50.1,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.3,
"r_y0": 288.6,
"r_x1": 238.8,
"r_y1": 288.6,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.3,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.5,
"r_y0": 288.8,
"r_x1": 286.4,
"r_y1": 288.8,
"r_x2": 286.4,
"r_y2": 279.9,
"r_x3": 241.5,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.8,
"r_x1": 211.4,
"r_y1": 300.8,
"r_x2": 211.4,
"r_y2": 291.9,
"r_x3": 50.1,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.3,
"r_y0": 300.5,
"r_x1": 229.2,
"r_y1": 300.5,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.3,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.8,
"r_x1": 232.2,
"r_y1": 300.8,
"r_x2": 232.2,
"r_y2": 291.9,
"r_x3": 229.7,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.5,
"r_y0": 300.5,
"r_x1": 251.4,
"r_y1": 300.5,
"r_x2": 251.4,
"r_y2": 291.7,
"r_x3": 236.5,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.8,
"r_y0": 300.8,
"r_x1": 286.4,
"r_y1": 300.8,
"r_x2": 286.4,
"r_y2": 291.9,
"r_x3": 254.8,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.7,
"r_x1": 137.5,
"r_y1": 312.7,
"r_x2": 137.5,
"r_y2": 303.8,
"r_x3": 50.1,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.2,
"r_y1": 312.5,
"r_x2": 148.2,
"r_y2": 303.7,
"r_x3": 141.3,
"r_y3": 303.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.6,
"r_y0": 312.7,
"r_x1": 286.4,
"r_y1": 312.7,
"r_x2": 286.4,
"r_y2": 303.8,
"r_x3": 152.6,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.7,
"r_x1": 89.7,
"r_y1": 324.7,
"r_x2": 89.7,
"r_y2": 315.8,
"r_x3": 50.1,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.7,
"r_y0": 324.5,
"r_x1": 104.1,
"r_y1": 324.5,
"r_x2": 104.1,
"r_y2": 315.6,
"r_x3": 89.7,
"r_y3": 315.6,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.6,
"r_y0": 324.7,
"r_x1": 286.4,
"r_y1": 324.7,
"r_x2": 286.4,
"r_y2": 315.8,
"r_x3": 104.6,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.6,
"r_x1": 286.4,
"r_y1": 336.6,
"r_x2": 286.4,
"r_y2": 327.7,
"r_x3": 50.1,
"r_y3": 327.7,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.6,
"r_x1": 286.4,
"r_y1": 348.6,
"r_x2": 286.4,
"r_y2": 339.7,
"r_x3": 50.1,
"r_y3": 339.7,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.5,
"r_x1": 286.4,
"r_y1": 360.5,
"r_x2": 286.4,
"r_y2": 351.6,
"r_x3": 50.1,
"r_y3": 351.6,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.5,
"r_x1": 286.4,
"r_y1": 372.5,
"r_x2": 286.4,
"r_y2": 363.6,
"r_x3": 50.1,
"r_y3": 363.6,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.5,
"r_x1": 286.4,
"r_y1": 384.5,
"r_x2": 286.4,
"r_y2": 375.5,
"r_x3": 50.1,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.4,
"r_x1": 286.4,
"r_y1": 396.4,
"r_x2": 286.4,
"r_y2": 387.5,
"r_x3": 50.1,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.4,
"r_x1": 88.7,
"r_y1": 408.4,
"r_x2": 88.7,
"r_y2": 399.5,
"r_x3": 50.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.6,
"r_y0": 408.1,
"r_x1": 170.1,
"r_y1": 408.1,
"r_x2": 170.1,
"r_y2": 399.5,
"r_x3": 91.6,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.1,
"r_y0": 408.4,
"r_x1": 286.4,
"r_y1": 408.4,
"r_x2": 286.4,
"r_y2": 399.5,
"r_x3": 170.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.3,
"r_x1": 182.0,
"r_y1": 420.3,
"r_x2": 182.0,
"r_y2": 411.4,
"r_x3": 50.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.1,
"r_y0": 420.3,
"r_x1": 197.7,
"r_y1": 420.3,
"r_x2": 197.7,
"r_y2": 411.4,
"r_x3": 189.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 420.3,
"r_x1": 286.4,
"r_y1": 420.3,
"r_x2": 286.4,
"r_y2": 411.4,
"r_x3": 200.3,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.3,
"r_x1": 286.4,
"r_y1": 432.3,
"r_x2": 286.4,
"r_y2": 423.4,
"r_x3": 50.1,
"r_y3": 423.4,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 158.3,
"r_y1": 444.2,
"r_x2": 158.3,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$. l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss (l$_{iou}$) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-to-one match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder, and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."
},
{
"label": "text",
"id": 11,
"page_no": 5,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 448.0,
"r": 286.4,
"b": 468.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 456.9,
"r_x1": 286.4,
"r_y1": 456.9,
"r_x2": 286.4,
"r_y2": 448.0,
"r_x3": 62.1,
"r_y3": 448.0,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 468.9,
"r_x1": 91.4,
"r_y1": 468.9,
"r_x2": 91.4,
"r_y2": 460.0,
"r_x3": 50.1,
"r_y3": 460.0,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The loss used to train the TableFormer can be defined as following:"
},
{
"label": "formula",
"id": 15,
"page_no": 5,
"cluster": {
"id": 15,
"label": "formula",
"bbox": {
"l": 124.3,
"t": 493.3,
"r": 286.4,
"b": 517.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.7,
"r_y0": 502.1,
"r_x1": 140.6,
"r_y1": 502.1,
"r_x2": 140.6,
"r_y2": 493.3,
"r_x3": 125.7,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.9,
"r_y0": 502.1,
"r_x1": 151.7,
"r_y1": 502.1,
"r_x2": 151.7,
"r_y2": 493.3,
"r_x3": 143.9,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.4,
"r_y0": 502.1,
"r_x1": 186.6,
"r_y1": 502.1,
"r_x2": 186.6,
"r_y2": 493.3,
"r_x3": 154.4,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.3,
"r_y0": 502.1,
"r_x1": 197.1,
"r_y1": 502.1,
"r_x2": 197.1,
"r_y2": 493.3,
"r_x3": 189.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.1,
"r_x1": 211.6,
"r_y1": 502.1,
"r_x2": 211.6,
"r_y2": 493.3,
"r_x3": 199.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.3,
"r_y0": 517.1,
"r_x1": 127.3,
"r_y1": 517.1,
"r_x2": 127.3,
"r_y2": 508.2,
"r_x3": 124.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.3,
"r_y0": 517.1,
"r_x1": 138.0,
"r_y1": 517.1,
"r_x2": 138.0,
"r_y2": 508.2,
"r_x3": 130.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.8,
"r_y0": 517.1,
"r_x1": 153.3,
"r_y1": 517.1,
"r_x2": 153.3,
"r_y2": 508.2,
"r_x3": 140.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 517.1,
"r_x1": 174.9,
"r_y1": 517.1,
"r_x2": 174.9,
"r_y2": 508.2,
"r_x3": 156.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.1,
"r_y0": 517.1,
"r_x1": 184.8,
"r_y1": 517.1,
"r_x2": 184.8,
"r_y2": 507.7,
"r_x3": 177.1,
"r_y3": 507.7,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 517.1,
"r_x1": 192.8,
"r_y1": 517.1,
"r_x2": 192.8,
"r_y2": 508.2,
"r_x3": 187.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.8,
"r_y0": 517.1,
"r_x1": 196.7,
"r_y1": 517.1,
"r_x2": 196.7,
"r_y2": 508.2,
"r_x3": 192.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.7,
"r_y0": 517.1,
"r_x1": 211.6,
"r_y1": 517.1,
"r_x2": 211.6,
"r_y2": 508.2,
"r_x3": 196.7,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 509.9,
"r_x1": 286.4,
"r_y1": 509.9,
"r_x2": 286.4,
"r_y2": 501.0,
"r_x3": 274.7,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)"
},
{
"label": "text",
"id": 16,
"page_no": 5,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 530.6,
"r": 281.6,
"b": 540.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 540.2,
"r_x1": 74.5,
"r_y1": 540.2,
"r_x2": 74.5,
"r_y2": 531.3,
"r_x3": 50.1,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 540.0,
"r_x1": 82.8,
"r_y1": 540.0,
"r_x2": 82.8,
"r_y2": 531.1,
"r_x3": 76.9,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.5,
"r_y0": 540.0,
"r_x1": 92.2,
"r_y1": 540.0,
"r_x2": 92.2,
"r_y2": 530.6,
"r_x3": 85.5,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.7,
"r_y0": 540.2,
"r_x1": 135.6,
"r_y1": 540.2,
"r_x2": 135.6,
"r_y2": 531.3,
"r_x3": 94.7,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.1,
"r_y0": 540.0,
"r_x1": 172.6,
"r_y1": 540.0,
"r_x2": 172.6,
"r_y2": 531.1,
"r_x3": 138.1,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.6,
"r_x3": 175.9,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.0,
"r_y0": 540.2,
"r_x1": 281.6,
"r_y1": 540.2,
"r_x2": 281.6,
"r_y2": 531.3,
"r_x3": 195.0,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters."
},
{
"label": "section_header",
"id": 12,
"page_no": 5,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 555.9,
"r": 172.0,
"b": 566.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 566.7,
"r_x1": 57.9,
"r_y1": 566.7,
"r_x2": 57.9,
"r_y2": 555.9,
"r_x3": 50.1,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 566.7,
"r_x1": 172.0,
"r_y1": 566.7,
"r_x2": 172.0,
"r_y2": 555.9,
"r_x3": 68.4,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Experimental Results"
},
{
"label": "section_header",
"id": 13,
"page_no": 5,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 576.3,
"r": 179.2,
"b": 586.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.1,
"r_x1": 64.7,
"r_y1": 586.1,
"r_x2": 64.7,
"r_y2": 576.3,
"r_x3": 50.1,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.4,
"r_y0": 586.1,
"r_x1": 179.2,
"r_y1": 586.1,
"r_x2": 179.2,
"r_y2": 576.3,
"r_x3": 74.4,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.1. Implementation Details"
},
{
"label": "text",
"id": 7,
"page_no": 5,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 595.7,
"r": 286.4,
"b": 640.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 604.6,
"r_x1": 203.0,
"r_y1": 604.6,
"r_x2": 203.0,
"r_y2": 595.7,
"r_x3": 62.1,
"r_y3": 595.7,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.4,
"r_y0": 604.4,
"r_x1": 286.4,
"r_y1": 604.4,
"r_x2": 286.4,
"r_y2": 595.8,
"r_x3": 205.4,
"r_y3": 595.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 616.4,
"r_x1": 70.0,
"r_y1": 616.4,
"r_x2": 70.0,
"r_y2": 607.8,
"r_x3": 50.1,
"r_y3": 607.8,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 616.6,
"r_x1": 286.4,
"r_y1": 616.6,
"r_x2": 286.4,
"r_y2": 607.7,
"r_x3": 70.0,
"r_y3": 607.7,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 628.6,
"r_x1": 286.4,
"r_y1": 628.6,
"r_x2": 286.4,
"r_y2": 619.6,
"r_x3": 50.1,
"r_y3": 619.6,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 640.5,
"r_x1": 207.0,
"r_y1": 640.5,
"r_x2": 207.0,
"r_y2": 631.6,
"r_x3": 50.1,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"
},
{
"label": "formula",
"id": 18,
"page_no": 5,
"cluster": {
"id": 18,
"label": "formula",
"bbox": {
"l": 91.7,
"t": 653.8,
"r": 286.4,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.7,
"r_y0": 663.5,
"r_x1": 186.0,
"r_y1": 663.5,
"r_x2": 186.0,
"r_y2": 654.5,
"r_x3": 91.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.5,
"r_y0": 663.2,
"r_x1": 196.3,
"r_y1": 663.2,
"r_x2": 196.3,
"r_y2": 653.8,
"r_x3": 188.5,
"r_y3": 653.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.7,
"r_y0": 663.5,
"r_x1": 244.8,
"r_y1": 663.5,
"r_x2": 244.8,
"r_y2": 654.5,
"r_x3": 198.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.0,
"r_y0": 678.4,
"r_x1": 186.2,
"r_y1": 678.4,
"r_x2": 186.2,
"r_y2": 669.5,
"r_x3": 101.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.7,
"r_y0": 678.2,
"r_x1": 196.5,
"r_y1": 678.2,
"r_x2": 196.5,
"r_y2": 668.8,
"r_x3": 188.7,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.0,
"r_y0": 678.4,
"r_x1": 244.8,
"r_y1": 678.4,
"r_x2": 244.8,
"r_y2": 669.5,
"r_x3": 199.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 671.0,
"r_x1": 286.4,
"r_y1": 671.0,
"r_x2": 286.4,
"r_y2": 662.1,
"r_x3": 274.7,
"r_y3": 662.1,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"
},
{
"label": "text",
"id": 10,
"page_no": 5,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"
},
{
"label": "text",
"id": 9,
"page_no": 5,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 340.0,
"r_y1": 96.1,
"r_x2": 340.0,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 346.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 493.0,
"r_y1": 108.0,
"r_x2": 493.0,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."
},
{
"label": "text",
"id": 1,
"page_no": 5,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 116.2,
"r": 545.1,
"b": 328.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 125.1,
"r_x1": 545.1,
"r_y1": 125.1,
"r_x2": 545.1,
"r_y2": 116.2,
"r_x3": 320.8,
"r_y3": 116.2,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 137.1,
"r_x1": 545.1,
"r_y1": 137.1,
"r_x2": 545.1,
"r_y2": 128.2,
"r_x3": 308.9,
"r_y3": 128.2,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 149.0,
"r_x1": 545.1,
"r_y1": 149.0,
"r_x2": 545.1,
"r_y2": 140.1,
"r_x3": 308.9,
"r_y3": 140.1,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 161.0,
"r_x1": 545.1,
"r_y1": 161.0,
"r_x2": 545.1,
"r_y2": 152.1,
"r_x3": 308.9,
"r_y3": 152.1,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 173.0,
"r_x1": 545.1,
"r_y1": 173.0,
"r_x2": 545.1,
"r_y2": 164.0,
"r_x3": 308.9,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 184.9,
"r_x1": 467.2,
"r_y1": 184.9,
"r_x2": 467.2,
"r_y2": 176.0,
"r_x3": 308.9,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.4,
"r_y0": 184.9,
"r_x1": 545.1,
"r_y1": 184.9,
"r_x2": 545.1,
"r_y2": 176.0,
"r_x3": 475.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 196.9,
"r_x1": 545.1,
"r_y1": 196.9,
"r_x2": 545.1,
"r_y2": 188.0,
"r_x3": 308.9,
"r_y3": 188.0,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 208.8,
"r_x1": 545.1,
"r_y1": 208.8,
"r_x2": 545.1,
"r_y2": 199.9,
"r_x3": 308.9,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 220.8,
"r_x1": 545.1,
"r_y1": 220.8,
"r_x2": 545.1,
"r_y2": 211.9,
"r_x3": 308.9,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.7,
"r_x1": 545.1,
"r_y1": 232.7,
"r_x2": 545.1,
"r_y2": 223.8,
"r_x3": 308.9,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 244.7,
"r_x1": 545.1,
"r_y1": 244.7,
"r_x2": 545.1,
"r_y2": 235.8,
"r_x3": 308.9,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.6,
"r_x1": 545.1,
"r_y1": 256.6,
"r_x2": 545.1,
"r_y2": 247.7,
"r_x3": 308.9,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.6,
"r_x1": 342.3,
"r_y1": 268.6,
"r_x2": 342.3,
"r_y2": 259.7,
"r_x3": 308.9,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.0,
"r_y0": 268.6,
"r_x1": 545.1,
"r_y1": 268.6,
"r_x2": 545.1,
"r_y2": 259.7,
"r_x3": 349.0,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.6,
"r_x1": 545.1,
"r_y1": 280.6,
"r_x2": 545.1,
"r_y2": 271.6,
"r_x3": 308.9,
"r_y3": 271.6,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.5,
"r_x1": 545.1,
"r_y1": 292.5,
"r_x2": 545.1,
"r_y2": 283.6,
"r_x3": 308.9,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 295.6,
"r_x3": 308.9,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.4,
"r_x1": 545.1,
"r_y1": 316.4,
"r_x2": 545.1,
"r_y2": 307.5,
"r_x3": 308.9,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.4,
"r_x1": 532.5,
"r_y1": 328.4,
"r_x2": 532.5,
"r_y2": 319.5,
"r_x3": 308.9,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."
},
{
"label": "text",
"id": 3,
"page_no": 5,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 336.6,
"r": 545.1,
"b": 429.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 345.5,
"r_x1": 545.1,
"r_y1": 345.5,
"r_x2": 545.1,
"r_y2": 336.6,
"r_x3": 320.8,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 357.4,
"r_x1": 403.7,
"r_y1": 357.4,
"r_x2": 403.7,
"r_y2": 348.5,
"r_x3": 308.9,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.1,
"r_y0": 357.2,
"r_x1": 503.5,
"r_y1": 357.2,
"r_x2": 503.5,
"r_y2": 348.6,
"r_x3": 406.1,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.5,
"r_y0": 357.4,
"r_x1": 506.0,
"r_y1": 357.4,
"r_x2": 506.0,
"r_y2": 348.5,
"r_x3": 503.5,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.2,
"r_x1": 545.1,
"r_y1": 357.2,
"r_x2": 545.1,
"r_y2": 348.6,
"r_x3": 508.4,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 369.2,
"r_x1": 343.2,
"r_y1": 369.2,
"r_x2": 343.2,
"r_y2": 360.6,
"r_x3": 308.9,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.2,
"r_y0": 369.4,
"r_x1": 362.2,
"r_y1": 369.4,
"r_x2": 362.2,
"r_y2": 360.5,
"r_x3": 343.2,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.3,
"r_y0": 369.2,
"r_x1": 440.9,
"r_y1": 369.2,
"r_x2": 440.9,
"r_y2": 360.6,
"r_x3": 364.3,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.9,
"r_y0": 369.4,
"r_x1": 545.1,
"r_y1": 369.4,
"r_x2": 545.1,
"r_y2": 360.5,
"r_x3": 440.9,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 381.3,
"r_x1": 545.1,
"r_y1": 381.3,
"r_x2": 545.1,
"r_y2": 372.4,
"r_x3": 308.9,
"r_y3": 372.4,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 393.3,
"r_x1": 545.1,
"r_y1": 393.3,
"r_x2": 545.1,
"r_y2": 384.4,
"r_x3": 308.9,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 405.0,
"r_x1": 314.7,
"r_y1": 405.0,
"r_x2": 314.7,
"r_y2": 396.2,
"r_x3": 308.9,
"r_y3": 396.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.7,
"r_y0": 405.3,
"r_x1": 360.4,
"r_y1": 405.3,
"r_x2": 360.4,
"r_y2": 396.4,
"r_x3": 318.7,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.0,
"r_y0": 405.3,
"r_x1": 545.1,
"r_y1": 405.3,
"r_x2": 545.1,
"r_y2": 396.4,
"r_x3": 368.0,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 417.2,
"r_x1": 545.1,
"r_y1": 417.2,
"r_x2": 545.1,
"r_y2": 408.3,
"r_x3": 308.9,
"r_y3": 408.3,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 429.2,
"r_x1": 361.0,
"r_y1": 429.2,
"r_x2": 361.0,
"r_y2": 420.3,
"r_x3": 308.9,
"r_y3": 420.3,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."
},
{
"label": "text",
"id": 0,
"page_no": 5,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 437.4,
"r": 545.1,
"b": 553.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 446.3,
"r_x1": 545.1,
"r_y1": 446.3,
"r_x2": 545.1,
"r_y2": 437.4,
"r_x3": 320.8,
"r_y3": 437.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 458.2,
"r_x1": 384.6,
"r_y1": 458.2,
"r_x2": 384.6,
"r_y2": 449.3,
"r_x3": 308.9,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 458.2,
"r_x1": 545.1,
"r_y1": 458.2,
"r_x2": 545.1,
"r_y2": 449.3,
"r_x3": 391.4,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 470.2,
"r_x1": 494.0,
"r_y1": 470.2,
"r_x2": 494.0,
"r_y2": 461.3,
"r_x3": 308.9,
"r_y3": 461.3,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.1,
"r_y0": 470.0,
"r_x1": 545.1,
"r_y1": 470.0,
"r_x2": 545.1,
"r_y2": 461.4,
"r_x3": 498.1,
"r_y3": 461.4,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 481.9,
"r_x1": 364.4,
"r_y1": 481.9,
"r_x2": 364.4,
"r_y2": 473.3,
"r_x3": 308.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.1,
"r_y0": 482.1,
"r_x1": 545.1,
"r_y1": 482.1,
"r_x2": 545.1,
"r_y2": 473.2,
"r_x3": 367.1,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 494.1,
"r_x1": 545.1,
"r_y1": 494.1,
"r_x2": 545.1,
"r_y2": 485.2,
"r_x3": 308.9,
"r_y3": 485.2,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 506.1,
"r_x1": 545.1,
"r_y1": 506.1,
"r_x2": 545.1,
"r_y2": 497.1,
"r_x3": 308.9,
"r_y3": 497.1,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 518.0,
"r_x1": 545.1,
"r_y1": 518.0,
"r_x2": 545.1,
"r_y2": 509.1,
"r_x3": 308.9,
"r_y3": 509.1,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 530.0,
"r_x1": 545.1,
"r_y1": 530.0,
"r_x2": 545.1,
"r_y2": 521.1,
"r_x3": 308.9,
"r_y3": 521.1,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 541.9,
"r_x1": 545.1,
"r_y1": 541.9,
"r_x2": 545.1,
"r_y2": 533.0,
"r_x3": 308.9,
"r_y3": 533.0,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 553.9,
"r_x1": 377.2,
"r_y1": 553.9,
"r_x2": 377.2,
"r_y2": 545.0,
"r_x3": 308.9,
"r_y3": 545.0,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."
},
{
"label": "section_header",
"id": 14,
"page_no": 5,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 579.6,
"r": 397.4,
"b": 589.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 589.4,
"r_x1": 323.9,
"r_y1": 589.4,
"r_x2": 323.9,
"r_y2": 579.6,
"r_x3": 308.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.9,
"r_y0": 589.4,
"r_x1": 397.4,
"r_y1": 589.4,
"r_x2": 397.4,
"r_y2": 579.6,
"r_x3": 333.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.2. Generalization"
},
{
"label": "text",
"id": 2,
"page_no": 5,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 603.4,
"r": 545.1,
"b": 672.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 612.4,
"r_x1": 545.1,
"r_y1": 612.4,
"r_x2": 545.1,
"r_y2": 603.4,
"r_x3": 320.8,
"r_y3": 603.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 624.3,
"r_x1": 545.1,
"r_y1": 624.3,
"r_x2": 545.1,
"r_y2": 615.4,
"r_x3": 308.9,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 636.3,
"r_x1": 545.1,
"r_y1": 636.3,
"r_x2": 545.1,
"r_y2": 627.4,
"r_x3": 308.9,
"r_y3": 627.4,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 648.2,
"r_x1": 545.1,
"r_y1": 648.2,
"r_x2": 545.1,
"r_y2": 639.3,
"r_x3": 308.9,
"r_y3": 639.3,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 660.2,
"r_x1": 545.1,
"r_y1": 660.2,
"r_x2": 545.1,
"r_y2": 651.3,
"r_x3": 308.9,
"r_y3": 651.3,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 672.1,
"r_x1": 350.7,
"r_y1": 672.1,
"r_x2": 350.7,
"r_y2": 663.2,
"r_x3": 308.9,
"r_y3": 663.2,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."
},
{
"label": "text",
"id": 8,
"page_no": 5,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 680.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 320.8,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 396.2,
"r_y1": 701.2,
"r_x2": 396.2,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.4,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 406.4,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 495.9,
"r_y1": 713.2,
"r_x2": 495.9,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."
},
{
"label": "page_footer",
"id": 17,
"page_no": 5,
"cluster": {
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6"
}
],
"body": [
{
"label": "text",
"id": 5,
"page_no": 5,
"cluster": {
"id": 5,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 286.4,
"b": 155.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 286.4,
"r_y1": 84.1,
"r_x2": 286.4,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "tention encoding is then multiplied to the encoded image to",
"orig": "tention encoding is then multiplied to the encoded image to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 50.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "produce a feature for each table cell. Notice that this is dif-",
"orig": "produce a feature for each table cell. Notice that this is dif-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 286.4,
"r_y1": 108.0,
"r_x2": 286.4,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "ferent than the typical object detection problem where im-",
"orig": "ferent than the typical object detection problem where im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 120.0,
"r_x1": 286.4,
"r_y1": 120.0,
"r_x2": 286.4,
"r_y2": 111.1,
"r_x3": 50.1,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "balances between the number of detections and the amount",
"orig": "balances between the number of detections and the amount",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.9,
"r_x1": 286.4,
"r_y1": 131.9,
"r_x2": 286.4,
"r_y2": 123.0,
"r_x3": 50.1,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "of objects may exist. In our case, we know up front that",
"orig": "of objects may exist. In our case, we know up front that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 143.9,
"r_x1": 286.4,
"r_y1": 143.9,
"r_x2": 286.4,
"r_y2": 135.0,
"r_x3": 50.1,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "the produced detections always match with the table cells",
"orig": "the produced detections always match with the table cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 155.8,
"r_x1": 175.2,
"r_y1": 155.8,
"r_x2": 175.2,
"r_y2": 146.9,
"r_x3": 50.1,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "in number and correspondence.",
"orig": "in number and correspondence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."
},
{
"label": "text",
"id": 6,
"page_no": 5,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 159.6,
"r": 286.4,
"b": 240.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 168.5,
"r_x1": 286.4,
"r_y1": 168.5,
"r_x2": 286.4,
"r_y2": 159.6,
"r_x3": 62.1,
"r_y3": 159.6,
"coord_origin": "TOPLEFT"
},
"text": "The output features for each table cell are then fed",
"orig": "The output features for each table cell are then fed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 180.5,
"r_x1": 286.4,
"r_y1": 180.5,
"r_x2": 286.4,
"r_y2": 171.6,
"r_x3": 50.1,
"r_y3": 171.6,
"coord_origin": "TOPLEFT"
},
"text": "into the feed-forward network (FFN). The FFN consists",
"orig": "into the feed-forward network (FFN). The FFN consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 192.4,
"r_x1": 286.4,
"r_y1": 192.4,
"r_x2": 286.4,
"r_y2": 183.5,
"r_x3": 50.1,
"r_y3": 183.5,
"coord_origin": "TOPLEFT"
},
"text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 204.4,
"r_x1": 286.4,
"r_y1": 204.4,
"r_x2": 286.4,
"r_y2": 195.5,
"r_x3": 50.1,
"r_y3": 195.5,
"coord_origin": "TOPLEFT"
},
"text": "tion function) that predicts the normalized coordinates for",
"orig": "tion function) that predicts the normalized coordinates for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 216.4,
"r_x1": 286.4,
"r_y1": 216.4,
"r_x2": 286.4,
"r_y2": 207.4,
"r_x3": 50.1,
"r_y3": 207.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding box of each table cell. Finally, the predicted",
"orig": "the bounding box of each table cell. Finally, the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 228.3,
"r_x1": 286.4,
"r_y1": 228.3,
"r_x2": 286.4,
"r_y2": 219.4,
"r_x3": 50.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes are classified based on whether they are",
"orig": "bounding boxes are classified based on whether they are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 240.3,
"r_x1": 181.5,
"r_y1": 240.3,
"r_x2": 181.5,
"r_y2": 231.4,
"r_x3": 50.1,
"r_y3": 231.4,
"coord_origin": "TOPLEFT"
},
"text": "empty or not using a linear layer.",
"orig": "empty or not using a linear layer.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."
},
{
"label": "text",
"id": 4,
"page_no": 5,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.9,
"r": 286.4,
"b": 444.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.9,
"r_x1": 129.2,
"r_y1": 252.9,
"r_x2": 129.2,
"r_y2": 243.9,
"r_x3": 62.1,
"r_y3": 243.9,
"coord_origin": "TOPLEFT"
},
"text": "Loss Functions.",
"orig": "Loss Functions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.5,
"r_y0": 252.9,
"r_x1": 286.4,
"r_y1": 252.9,
"r_x2": 286.4,
"r_y2": 244.0,
"r_x3": 134.5,
"r_y3": 244.0,
"coord_origin": "TOPLEFT"
},
"text": "We formulate a multi-task loss Eq. 2",
"orig": "We formulate a multi-task loss Eq. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.9,
"r_x1": 286.4,
"r_y1": 264.9,
"r_x2": 286.4,
"r_y2": 256.0,
"r_x3": 50.1,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "to train our network. The Cross-Entropy loss (denoted as",
"orig": "to train our network. The Cross-Entropy loss (denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 56.8,
"r_y1": 276.6,
"r_x2": 56.8,
"r_y2": 267.8,
"r_x3": 50.1,
"r_y3": 267.8,
"coord_origin": "TOPLEFT"
},
"text": "l$_{s}$",
"orig": "l$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 57.3,
"r_y0": 276.9,
"r_x1": 135.4,
"r_y1": 276.9,
"r_x2": 135.4,
"r_y2": 268.0,
"r_x3": 57.3,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": ") is used to train the",
"orig": ") is used to train the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.7,
"r_y0": 276.6,
"r_x1": 211.1,
"r_y1": 276.6,
"r_x2": 211.1,
"r_y2": 268.0,
"r_x3": 137.7,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.6,
"r_y0": 276.9,
"r_x1": 286.4,
"r_y1": 276.9,
"r_x2": 286.4,
"r_y2": 268.0,
"r_x3": 213.6,
"r_y3": 268.0,
"coord_origin": "TOPLEFT"
},
"text": "which predicts the",
"orig": "which predicts the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.8,
"r_x1": 158.8,
"r_y1": 288.8,
"r_x2": 158.8,
"r_y2": 279.9,
"r_x3": 50.1,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "structure tokens. As for the",
"orig": "structure tokens. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.3,
"r_y0": 288.6,
"r_x1": 238.8,
"r_y1": 288.6,
"r_x2": 238.8,
"r_y2": 280.0,
"r_x3": 161.3,
"r_y3": 280.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.5,
"r_y0": 288.8,
"r_x1": 286.4,
"r_y1": 288.8,
"r_x2": 286.4,
"r_y2": 279.9,
"r_x3": 241.5,
"r_y3": 279.9,
"coord_origin": "TOPLEFT"
},
"text": "it is trained",
"orig": "it is trained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.8,
"r_x1": 211.4,
"r_y1": 300.8,
"r_x2": 211.4,
"r_y2": 291.9,
"r_x3": 50.1,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "with a combination of losses denoted as",
"orig": "with a combination of losses denoted as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 214.3,
"r_y0": 300.5,
"r_x1": 229.2,
"r_y1": 300.5,
"r_x2": 229.2,
"r_y2": 291.7,
"r_x3": 214.3,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.7,
"r_y0": 300.8,
"r_x1": 232.2,
"r_y1": 300.8,
"r_x2": 232.2,
"r_y2": 291.9,
"r_x3": 229.7,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 236.5,
"r_y0": 300.5,
"r_x1": 251.4,
"r_y1": 300.5,
"r_x2": 251.4,
"r_y2": 291.7,
"r_x3": 236.5,
"r_y3": 291.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.8,
"r_y0": 300.8,
"r_x1": 286.4,
"r_y1": 300.8,
"r_x2": 286.4,
"r_y2": 291.9,
"r_x3": 254.8,
"r_y3": 291.9,
"coord_origin": "TOPLEFT"
},
"text": "consists",
"orig": "consists",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.7,
"r_x1": 137.5,
"r_y1": 312.7,
"r_x2": 137.5,
"r_y2": 303.8,
"r_x3": 50.1,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "of the generally used",
"orig": "of the generally used",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 141.3,
"r_y0": 312.5,
"r_x1": 148.2,
"r_y1": 312.5,
"r_x2": 148.2,
"r_y2": 303.7,
"r_x3": 141.3,
"r_y3": 303.7,
"coord_origin": "TOPLEFT"
},
"text": "l$_{1}$",
"orig": "l$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 152.6,
"r_y0": 312.7,
"r_x1": 286.4,
"r_y1": 312.7,
"r_x2": 286.4,
"r_y2": 303.8,
"r_x3": 152.6,
"r_y3": 303.8,
"coord_origin": "TOPLEFT"
},
"text": "loss for object detection and the",
"orig": "loss for object detection and the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.7,
"r_x1": 89.7,
"r_y1": 324.7,
"r_x2": 89.7,
"r_y2": 315.8,
"r_x3": 50.1,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": "IoU loss (",
"orig": "IoU loss (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.7,
"r_y0": 324.5,
"r_x1": 104.1,
"r_y1": 324.5,
"r_x2": 104.1,
"r_y2": 315.6,
"r_x3": 89.7,
"r_y3": 315.6,
"coord_origin": "TOPLEFT"
},
"text": "l$_{iou}$",
"orig": "l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.6,
"r_y0": 324.7,
"r_x1": 286.4,
"r_y1": 324.7,
"r_x2": 286.4,
"r_y2": 315.8,
"r_x3": 104.6,
"r_y3": 315.8,
"coord_origin": "TOPLEFT"
},
"text": ") to be scale invariant as explained in [25]. In",
"orig": ") to be scale invariant as explained in [25]. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.6,
"r_x1": 286.4,
"r_y1": 336.6,
"r_x2": 286.4,
"r_y2": 327.7,
"r_x3": 50.1,
"r_y3": 327.7,
"coord_origin": "TOPLEFT"
},
"text": "comparison to DETR, we do not use the Hungarian algo-",
"orig": "comparison to DETR, we do not use the Hungarian algo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.6,
"r_x1": 286.4,
"r_y1": 348.6,
"r_x2": 286.4,
"r_y2": 339.7,
"r_x3": 50.1,
"r_y3": 339.7,
"coord_origin": "TOPLEFT"
},
"text": "rithm [15] to match the predicted bounding boxes with the",
"orig": "rithm [15] to match the predicted bounding boxes with the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.5,
"r_x1": 286.4,
"r_y1": 360.5,
"r_x2": 286.4,
"r_y2": 351.6,
"r_x3": 50.1,
"r_y3": 351.6,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth boxes, as we have already achieved a one-to-",
"orig": "ground-truth boxes, as we have already achieved a one-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.5,
"r_x1": 286.4,
"r_y1": 372.5,
"r_x2": 286.4,
"r_y2": 363.6,
"r_x3": 50.1,
"r_y3": 363.6,
"coord_origin": "TOPLEFT"
},
"text": "one match through two steps: 1) Our token input sequence",
"orig": "one match through two steps: 1) Our token input sequence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.5,
"r_x1": 286.4,
"r_y1": 384.5,
"r_x2": 286.4,
"r_y2": 375.5,
"r_x3": 50.1,
"r_y3": 375.5,
"coord_origin": "TOPLEFT"
},
"text": "is naturally ordered, therefore the hidden states of the table",
"orig": "is naturally ordered, therefore the hidden states of the table",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.4,
"r_x1": 286.4,
"r_y1": 396.4,
"r_x2": 286.4,
"r_y2": 387.5,
"r_x3": 50.1,
"r_y3": 387.5,
"coord_origin": "TOPLEFT"
},
"text": "data cells are also in order when they are provided as in-",
"orig": "data cells are also in order when they are provided as in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 408.4,
"r_x1": 88.7,
"r_y1": 408.4,
"r_x2": 88.7,
"r_y2": 399.5,
"r_x3": 50.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "put to the",
"orig": "put to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.6,
"r_y0": 408.1,
"r_x1": 170.1,
"r_y1": 408.1,
"r_x2": 170.1,
"r_y2": 399.5,
"r_x3": 91.6,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.1,
"r_y0": 408.4,
"r_x1": 286.4,
"r_y1": 408.4,
"r_x2": 286.4,
"r_y2": 399.5,
"r_x3": 170.1,
"r_y3": 399.5,
"coord_origin": "TOPLEFT"
},
"text": ", and 2) Our bounding boxes",
"orig": ", and 2) Our bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 420.3,
"r_x1": 182.0,
"r_y1": 420.3,
"r_x2": 182.0,
"r_y2": 411.4,
"r_x3": 50.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "generation mechanism (see Sec.",
"orig": "generation mechanism (see Sec.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.1,
"r_y0": 420.3,
"r_x1": 197.7,
"r_y1": 420.3,
"r_x2": 197.7,
"r_y2": 411.4,
"r_x3": 189.1,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "3)",
"orig": "3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.3,
"r_y0": 420.3,
"r_x1": 286.4,
"r_y1": 420.3,
"r_x2": 286.4,
"r_y2": 411.4,
"r_x3": 200.3,
"r_y3": 411.4,
"coord_origin": "TOPLEFT"
},
"text": "ensures a one-to-one",
"orig": "ensures a one-to-one",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 432.3,
"r_x1": 286.4,
"r_y1": 432.3,
"r_x2": 286.4,
"r_y2": 423.4,
"r_x3": 50.1,
"r_y3": 423.4,
"coord_origin": "TOPLEFT"
},
"text": "mapping between the cell content and its bounding box for",
"orig": "mapping between the cell content and its bounding box for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 158.3,
"r_y1": 444.2,
"r_x2": 158.3,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "all post-processed datasets.",
"orig": "all post-processed datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l$_{s}$ ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l$_{box}$ . l$_{box}$ consists of the generally used l$_{1}$ loss for object detection and the IoU loss ( l$_{iou}$ ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."
},
{
"label": "text",
"id": 11,
"page_no": 5,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 448.0,
"r": 286.4,
"b": 468.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 456.9,
"r_x1": 286.4,
"r_y1": 456.9,
"r_x2": 286.4,
"r_y2": 448.0,
"r_x3": 62.1,
"r_y3": 448.0,
"coord_origin": "TOPLEFT"
},
"text": "The loss used to train the TableFormer can be defined as",
"orig": "The loss used to train the TableFormer can be defined as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 468.9,
"r_x1": 91.4,
"r_y1": 468.9,
"r_x2": 91.4,
"r_y2": 460.0,
"r_x3": 50.1,
"r_y3": 460.0,
"coord_origin": "TOPLEFT"
},
"text": "following:",
"orig": "following:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The loss used to train the TableFormer can be defined as following:"
},
{
"label": "formula",
"id": 15,
"page_no": 5,
"cluster": {
"id": 15,
"label": "formula",
"bbox": {
"l": 124.3,
"t": 493.3,
"r": 286.4,
"b": 517.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.7,
"r_y0": 502.1,
"r_x1": 140.6,
"r_y1": 502.1,
"r_x2": 140.6,
"r_y2": 493.3,
"r_x3": 125.7,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.9,
"r_y0": 502.1,
"r_x1": 151.7,
"r_y1": 502.1,
"r_x2": 151.7,
"r_y2": 493.3,
"r_x3": 143.9,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.4,
"r_y0": 502.1,
"r_x1": 186.6,
"r_y1": 502.1,
"r_x2": 186.6,
"r_y2": 493.3,
"r_x3": 154.4,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$l$_{iou}$",
"orig": "\u03bb$_{iou}$l$_{iou}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.3,
"r_y0": 502.1,
"r_x1": 197.1,
"r_y1": 502.1,
"r_x2": 197.1,
"r_y2": 493.3,
"r_x3": 189.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "+",
"orig": "+",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.3,
"r_y0": 502.1,
"r_x1": 211.6,
"r_y1": 502.1,
"r_x2": 211.6,
"r_y2": 493.3,
"r_x3": 199.3,
"r_y3": 493.3,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.3,
"r_y0": 517.1,
"r_x1": 127.3,
"r_y1": 517.1,
"r_x2": 127.3,
"r_y2": 508.2,
"r_x3": 124.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l",
"orig": "l",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.3,
"r_y0": 517.1,
"r_x1": 138.0,
"r_y1": 517.1,
"r_x2": 138.0,
"r_y2": 508.2,
"r_x3": 130.3,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.8,
"r_y0": 517.1,
"r_x1": 153.3,
"r_y1": 517.1,
"r_x2": 153.3,
"r_y2": 508.2,
"r_x3": 140.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bbl$_{s}$",
"orig": "\u03bbl$_{s}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 517.1,
"r_x1": 174.9,
"r_y1": 517.1,
"r_x2": 174.9,
"r_y2": 508.2,
"r_x3": 156.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "+ (1",
"orig": "+ (1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 177.1,
"r_y0": 517.1,
"r_x1": 184.8,
"r_y1": 517.1,
"r_x2": 184.8,
"r_y2": 507.7,
"r_x3": 177.1,
"r_y3": 507.7,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 517.1,
"r_x1": 192.8,
"r_y1": 517.1,
"r_x2": 192.8,
"r_y2": 508.2,
"r_x3": 187.0,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 192.8,
"r_y0": 517.1,
"r_x1": 196.7,
"r_y1": 517.1,
"r_x2": 196.7,
"r_y2": 508.2,
"r_x3": 192.8,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.7,
"r_y0": 517.1,
"r_x1": 211.6,
"r_y1": 517.1,
"r_x2": 211.6,
"r_y2": 508.2,
"r_x3": 196.7,
"r_y3": 508.2,
"coord_origin": "TOPLEFT"
},
"text": "l$_{box}$",
"orig": "l$_{box}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 509.9,
"r_x1": 286.4,
"r_y1": 509.9,
"r_x2": 286.4,
"r_y2": 501.0,
"r_x3": 274.7,
"r_y3": 501.0,
"coord_origin": "TOPLEFT"
},
"text": "(1)",
"orig": "(1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "l$_{box}$ = \u03bb$_{iou}$l$_{iou}$ + \u03bb$_{l}$$_{1}$ l = \u03bbl$_{s}$ + (1 \u2212 \u03bb ) l$_{box}$ (1)"
},
{
"label": "text",
"id": 16,
"page_no": 5,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 530.6,
"r": 281.6,
"b": 540.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 540.2,
"r_x1": 74.5,
"r_y1": 540.2,
"r_x2": 74.5,
"r_y2": 531.3,
"r_x3": 50.1,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.9,
"r_y0": 540.0,
"r_x1": 82.8,
"r_y1": 540.0,
"r_x2": 82.8,
"r_y2": 531.1,
"r_x3": 76.9,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 85.5,
"r_y0": 540.0,
"r_x1": 92.2,
"r_y1": 540.0,
"r_x2": 92.2,
"r_y2": 530.6,
"r_x3": 85.5,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208",
"orig": "\u2208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 94.7,
"r_y0": 540.2,
"r_x1": 135.6,
"r_y1": 540.2,
"r_x2": 135.6,
"r_y2": 531.3,
"r_x3": 94.7,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "[0, 1], and",
"orig": "[0, 1], and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.1,
"r_y0": 540.0,
"r_x1": 172.6,
"r_y1": 540.0,
"r_x2": 172.6,
"r_y2": 531.1,
"r_x3": 138.1,
"r_y3": 531.1,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"orig": "\u03bb$_{iou}$, \u03bb$_{l}$$_{1}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.9,
"r_y0": 540.0,
"r_x1": 192.5,
"r_y1": 540.0,
"r_x2": 192.5,
"r_y2": 530.6,
"r_x3": 175.9,
"r_y3": 530.6,
"coord_origin": "TOPLEFT"
},
"text": "\u2208$_{R}$",
"orig": "\u2208$_{R}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.0,
"r_y0": 540.2,
"r_x1": 281.6,
"r_y1": 540.2,
"r_x2": 281.6,
"r_y2": 531.3,
"r_x3": 195.0,
"r_y3": 531.3,
"coord_origin": "TOPLEFT"
},
"text": "are hyper-parameters.",
"orig": "are hyper-parameters.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where \u03bb \u2208 [0, 1], and \u03bb$_{iou}$, \u03bb$_{l}$$_{1}$ \u2208$_{R}$ are hyper-parameters."
},
{
"label": "section_header",
"id": 12,
"page_no": 5,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 555.9,
"r": 172.0,
"b": 566.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 566.7,
"r_x1": 57.9,
"r_y1": 566.7,
"r_x2": 57.9,
"r_y2": 555.9,
"r_x3": 50.1,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 566.7,
"r_x1": 172.0,
"r_y1": 566.7,
"r_x2": 172.0,
"r_y2": 555.9,
"r_x3": 68.4,
"r_y3": 555.9,
"coord_origin": "TOPLEFT"
},
"text": "Experimental Results",
"orig": "Experimental Results",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Experimental Results"
},
{
"label": "section_header",
"id": 13,
"page_no": 5,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 576.3,
"r": 179.2,
"b": 586.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 586.1,
"r_x1": 64.7,
"r_y1": 586.1,
"r_x2": 64.7,
"r_y2": 576.3,
"r_x3": 50.1,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "5.1.",
"orig": "5.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.4,
"r_y0": 586.1,
"r_x1": 179.2,
"r_y1": 586.1,
"r_x2": 179.2,
"r_y2": 576.3,
"r_x3": 74.4,
"r_y3": 576.3,
"coord_origin": "TOPLEFT"
},
"text": "Implementation Details",
"orig": "Implementation Details",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.1. Implementation Details"
},
{
"label": "text",
"id": 7,
"page_no": 5,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 595.7,
"r": 286.4,
"b": 640.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 604.6,
"r_x1": 203.0,
"r_y1": 604.6,
"r_x2": 203.0,
"r_y2": 595.7,
"r_x3": 62.1,
"r_y3": 595.7,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer uses ResNet-18 as the",
"orig": "TableFormer uses ResNet-18 as the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 205.4,
"r_y0": 604.4,
"r_x1": 286.4,
"r_y1": 604.4,
"r_x2": 286.4,
"r_y2": 595.8,
"r_x3": 205.4,
"r_y3": 595.8,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Net-",
"orig": "CNN Backbone Net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 616.4,
"r_x1": 70.0,
"r_y1": 616.4,
"r_x2": 70.0,
"r_y2": 607.8,
"r_x3": 50.1,
"r_y3": 607.8,
"coord_origin": "TOPLEFT"
},
"text": "work",
"orig": "work",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 616.6,
"r_x1": 286.4,
"r_y1": 616.6,
"r_x2": 286.4,
"r_y2": 607.7,
"r_x3": 70.0,
"r_y3": 607.7,
"coord_origin": "TOPLEFT"
},
"text": ". The input images are resized to 448*448 pixels and",
"orig": ". The input images are resized to 448*448 pixels and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 628.6,
"r_x1": 286.4,
"r_y1": 628.6,
"r_x2": 286.4,
"r_y2": 619.6,
"r_x3": 50.1,
"r_y3": 619.6,
"coord_origin": "TOPLEFT"
},
"text": "the feature map has a dimension of 28*28. Additionally, we",
"orig": "the feature map has a dimension of 28*28. Additionally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 640.5,
"r_x1": 207.0,
"r_y1": 640.5,
"r_x2": 207.0,
"r_y2": 631.6,
"r_x3": 50.1,
"r_y3": 631.6,
"coord_origin": "TOPLEFT"
},
"text": "enforce the following input constraints:",
"orig": "enforce the following input constraints:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"
},
{
"label": "formula",
"id": 18,
"page_no": 5,
"cluster": {
"id": 18,
"label": "formula",
"bbox": {
"l": 91.7,
"t": 653.8,
"r": 286.4,
"b": 678.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.7,
"r_y0": 663.5,
"r_x1": 186.0,
"r_y1": 663.5,
"r_x2": 186.0,
"r_y2": 654.5,
"r_x3": 91.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "Image width and height",
"orig": "Image width and height",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.5,
"r_y0": 663.2,
"r_x1": 196.3,
"r_y1": 663.2,
"r_x2": 196.3,
"r_y2": 653.8,
"r_x3": 188.5,
"r_y3": 653.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.7,
"r_y0": 663.5,
"r_x1": 244.8,
"r_y1": 663.5,
"r_x2": 244.8,
"r_y2": 654.5,
"r_x3": 198.7,
"r_y3": 654.5,
"coord_origin": "TOPLEFT"
},
"text": "1024 pixels",
"orig": "1024 pixels",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.0,
"r_y0": 678.4,
"r_x1": 186.2,
"r_y1": 678.4,
"r_x2": 186.2,
"r_y2": 669.5,
"r_x3": 101.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "Structural tags length",
"orig": "Structural tags length",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 188.7,
"r_y0": 678.2,
"r_x1": 196.5,
"r_y1": 678.2,
"r_x2": 196.5,
"r_y2": 668.8,
"r_x3": 188.7,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "\u2264",
"orig": "\u2264",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.0,
"r_y0": 678.4,
"r_x1": 244.8,
"r_y1": 678.4,
"r_x2": 244.8,
"r_y2": 669.5,
"r_x3": 199.0,
"r_y3": 669.5,
"coord_origin": "TOPLEFT"
},
"text": "512 tokens.",
"orig": "512 tokens.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 671.0,
"r_x1": 286.4,
"r_y1": 671.0,
"r_x2": 286.4,
"r_y2": 662.1,
"r_x3": 274.7,
"r_y3": 662.1,
"coord_origin": "TOPLEFT"
},
"text": "(2)",
"orig": "(2)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"
},
{
"label": "text",
"id": 10,
"page_no": 5,
"cluster": {
"id": 10,
"label": "text",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Although input constraints are used also by other methods,",
"orig": "Although input constraints are used also by other methods,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "such as EDD, ours are less restrictive due to the improved",
"orig": "such as EDD, ours are less restrictive due to the improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"
},
{
"label": "text",
"id": 9,
"page_no": 5,
"cluster": {
"id": 9,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "runtime performance and lower memory footprint of Table-",
"orig": "runtime performance and lower memory footprint of Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 340.0,
"r_y1": 96.1,
"r_x2": 340.0,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "Former.",
"orig": "Former.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 346.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "This allows to utilize input samples with longer",
"orig": "This allows to utilize input samples with longer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 493.0,
"r_y1": 108.0,
"r_x2": 493.0,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "sequences and images with larger dimensions.",
"orig": "sequences and images with larger dimensions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."
},
{
"label": "text",
"id": 1,
"page_no": 5,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 116.2,
"r": 545.1,
"b": 328.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 125.1,
"r_x1": 545.1,
"r_y1": 125.1,
"r_x2": 545.1,
"r_y2": 116.2,
"r_x3": 320.8,
"r_y3": 116.2,
"coord_origin": "TOPLEFT"
},
"text": "The Transformer Encoder consists of two \u201cTransformer",
"orig": "The Transformer Encoder consists of two \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 137.1,
"r_x1": 545.1,
"r_y1": 137.1,
"r_x2": 545.1,
"r_y2": 128.2,
"r_x3": 308.9,
"r_y3": 128.2,
"coord_origin": "TOPLEFT"
},
"text": "Encoder Layers\u201d, with an input feature size of 512, feed",
"orig": "Encoder Layers\u201d, with an input feature size of 512, feed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 149.0,
"r_x1": 545.1,
"r_y1": 149.0,
"r_x2": 545.1,
"r_y2": 140.1,
"r_x3": 308.9,
"r_y3": 140.1,
"coord_origin": "TOPLEFT"
},
"text": "forward network of 1024, and 4 attention heads. As for the",
"orig": "forward network of 1024, and 4 attention heads. As for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 161.0,
"r_x1": 545.1,
"r_y1": 161.0,
"r_x2": 545.1,
"r_y2": 152.1,
"r_x3": 308.9,
"r_y3": 152.1,
"coord_origin": "TOPLEFT"
},
"text": "Transformer Decoder it is composed of four \u201cTransformer",
"orig": "Transformer Decoder it is composed of four \u201cTransformer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 173.0,
"r_x1": 545.1,
"r_y1": 173.0,
"r_x2": 545.1,
"r_y2": 164.0,
"r_x3": 308.9,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder Layers\u201d with similar input and output dimensions",
"orig": "Decoder Layers\u201d with similar input and output dimensions",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 184.9,
"r_x1": 467.2,
"r_y1": 184.9,
"r_x2": 467.2,
"r_y2": 176.0,
"r_x3": 308.9,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "as the \u201cTransformer Encoder Layers\u201d.",
"orig": "as the \u201cTransformer Encoder Layers\u201d.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.4,
"r_y0": 184.9,
"r_x1": 545.1,
"r_y1": 184.9,
"r_x2": 545.1,
"r_y2": 176.0,
"r_x3": 475.4,
"r_y3": 176.0,
"coord_origin": "TOPLEFT"
},
"text": "Even though our",
"orig": "Even though our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 196.9,
"r_x1": 545.1,
"r_y1": 196.9,
"r_x2": 545.1,
"r_y2": 188.0,
"r_x3": 308.9,
"r_y3": 188.0,
"coord_origin": "TOPLEFT"
},
"text": "model uses fewer layers and heads than the default imple-",
"orig": "model uses fewer layers and heads than the default imple-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 208.8,
"r_x1": 545.1,
"r_y1": 208.8,
"r_x2": 545.1,
"r_y2": 199.9,
"r_x3": 308.9,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "mentation parameters, our extensive experimentation has",
"orig": "mentation parameters, our extensive experimentation has",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 220.8,
"r_x1": 545.1,
"r_y1": 220.8,
"r_x2": 545.1,
"r_y2": 211.9,
"r_x3": 308.9,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "proved this setup to be more suitable for table images. We",
"orig": "proved this setup to be more suitable for table images. We",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.7,
"r_x1": 545.1,
"r_y1": 232.7,
"r_x2": 545.1,
"r_y2": 223.8,
"r_x3": 308.9,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "attribute this finding to the inherent design of table im-",
"orig": "attribute this finding to the inherent design of table im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 244.7,
"r_x1": 545.1,
"r_y1": 244.7,
"r_x2": 545.1,
"r_y2": 235.8,
"r_x3": 308.9,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "ages, which contain mostly lines and text, unlike the more",
"orig": "ages, which contain mostly lines and text, unlike the more",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.6,
"r_x1": 545.1,
"r_y1": 256.6,
"r_x2": 545.1,
"r_y2": 247.7,
"r_x3": 308.9,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "elaborate content present in other scopes (e.g. the COCO",
"orig": "elaborate content present in other scopes (e.g. the COCO",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.6,
"r_x1": 342.3,
"r_y1": 268.6,
"r_x2": 342.3,
"r_y2": 259.7,
"r_x3": 308.9,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "dataset).",
"orig": "dataset).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.0,
"r_y0": 268.6,
"r_x1": 545.1,
"r_y1": 268.6,
"r_x2": 545.1,
"r_y2": 259.7,
"r_x3": 349.0,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "Moreover, we have added ResNet blocks to the",
"orig": "Moreover, we have added ResNet blocks to the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.6,
"r_x1": 545.1,
"r_y1": 280.6,
"r_x2": 545.1,
"r_y2": 271.6,
"r_x3": 308.9,
"r_y3": 271.6,
"coord_origin": "TOPLEFT"
},
"text": "inputs of the Structure Decoder and Cell BBox Decoder.",
"orig": "inputs of the Structure Decoder and Cell BBox Decoder.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.5,
"r_x1": 545.1,
"r_y1": 292.5,
"r_x2": 545.1,
"r_y2": 283.6,
"r_x3": 308.9,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "This prevents a decoder having a stronger influence over the",
"orig": "This prevents a decoder having a stronger influence over the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 295.6,
"r_x3": 308.9,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "learned weights which would damage the other prediction",
"orig": "learned weights which would damage the other prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.4,
"r_x1": 545.1,
"r_y1": 316.4,
"r_x2": 545.1,
"r_y2": 307.5,
"r_x3": 308.9,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "task (structure vs bounding boxes), but learn task specific",
"orig": "task (structure vs bounding boxes), but learn task specific",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.4,
"r_x1": 532.5,
"r_y1": 328.4,
"r_x2": 532.5,
"r_y2": 319.5,
"r_x3": 308.9,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "weights instead. Lastly our dropout layers are set to 0.5.",
"orig": "weights instead. Lastly our dropout layers are set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Transformer Encoder consists of two \"Transformer Encoder Layers\", with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four \"Transformer Decoder Layers\" with similar input and output dimensions as the \"Transformer Encoder Layers\". Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."
},
{
"label": "text",
"id": 3,
"page_no": 5,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 308.9,
"t": 336.6,
"r": 545.1,
"b": 429.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 345.5,
"r_x1": 545.1,
"r_y1": 345.5,
"r_x2": 545.1,
"r_y2": 336.6,
"r_x3": 320.8,
"r_y3": 336.6,
"coord_origin": "TOPLEFT"
},
"text": "For training, TableFormer is trained with 3 Adam opti-",
"orig": "For training, TableFormer is trained with 3 Adam opti-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 357.4,
"r_x1": 403.7,
"r_y1": 357.4,
"r_x2": 403.7,
"r_y2": 348.5,
"r_x3": 308.9,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": "mizers, each one for the",
"orig": "mizers, each one for the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.1,
"r_y0": 357.2,
"r_x1": 503.5,
"r_y1": 357.2,
"r_x2": 503.5,
"r_y2": 348.6,
"r_x3": 406.1,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "CNN Backbone Network",
"orig": "CNN Backbone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 503.5,
"r_y0": 357.4,
"r_x1": 506.0,
"r_y1": 357.4,
"r_x2": 506.0,
"r_y2": 348.5,
"r_x3": 503.5,
"r_y3": 348.5,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.4,
"r_y0": 357.2,
"r_x1": 545.1,
"r_y1": 357.2,
"r_x2": 545.1,
"r_y2": 348.6,
"r_x3": 508.4,
"r_y3": 348.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure",
"orig": "Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 369.2,
"r_x1": 343.2,
"r_y1": 369.2,
"r_x2": 343.2,
"r_y2": 360.6,
"r_x3": 308.9,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 343.2,
"r_y0": 369.4,
"r_x1": 362.2,
"r_y1": 369.4,
"r_x2": 362.2,
"r_y2": 360.5,
"r_x3": 343.2,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ", and",
"orig": ", and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 364.3,
"r_y0": 369.2,
"r_x1": 440.9,
"r_y1": 369.2,
"r_x2": 440.9,
"r_y2": 360.6,
"r_x3": 364.3,
"r_y3": 360.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 440.9,
"r_y0": 369.4,
"r_x1": 545.1,
"r_y1": 369.4,
"r_x2": 545.1,
"r_y2": 360.5,
"r_x3": 440.9,
"r_y3": 360.5,
"coord_origin": "TOPLEFT"
},
"text": ". Taking the PubTabNet as",
"orig": ". Taking the PubTabNet as",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 381.3,
"r_x1": 545.1,
"r_y1": 381.3,
"r_x2": 545.1,
"r_y2": 372.4,
"r_x3": 308.9,
"r_y3": 372.4,
"coord_origin": "TOPLEFT"
},
"text": "an example for our parameter set up, the initializing learn-",
"orig": "an example for our parameter set up, the initializing learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 393.3,
"r_x1": 545.1,
"r_y1": 393.3,
"r_x2": 545.1,
"r_y2": 384.4,
"r_x3": 308.9,
"r_y3": 384.4,
"coord_origin": "TOPLEFT"
},
"text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 405.0,
"r_x1": 314.7,
"r_y1": 405.0,
"r_x2": 314.7,
"r_y2": 396.2,
"r_x3": 308.9,
"r_y3": 396.2,
"coord_origin": "TOPLEFT"
},
"text": "\u03bb",
"orig": "\u03bb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 318.7,
"r_y0": 405.3,
"r_x1": 360.4,
"r_y1": 405.3,
"r_x2": 360.4,
"r_y2": 396.4,
"r_x3": 318.7,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "set to 0.5.",
"orig": "set to 0.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.0,
"r_y0": 405.3,
"r_x1": 545.1,
"r_y1": 405.3,
"r_x2": 545.1,
"r_y2": 396.4,
"r_x3": 368.0,
"r_y3": 396.4,
"coord_origin": "TOPLEFT"
},
"text": "Afterwards, we reduce the learning rate to",
"orig": "Afterwards, we reduce the learning rate to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 417.2,
"r_x1": 545.1,
"r_y1": 417.2,
"r_x2": 545.1,
"r_y2": 408.3,
"r_x3": 308.9,
"r_y3": 408.3,
"coord_origin": "TOPLEFT"
},
"text": "0.0001, the batch size to 18 and train for 12 more epochs or",
"orig": "0.0001, the batch size to 18 and train for 12 more epochs or",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 429.2,
"r_x1": 361.0,
"r_y1": 429.2,
"r_x2": 361.0,
"r_y2": 420.3,
"r_x3": 308.9,
"r_y3": 420.3,
"coord_origin": "TOPLEFT"
},
"text": "convergence.",
"orig": "convergence.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network , Structure Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."
},
{
"label": "text",
"id": 0,
"page_no": 5,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 437.4,
"r": 545.1,
"b": 553.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 446.3,
"r_x1": 545.1,
"r_y1": 446.3,
"r_x2": 545.1,
"r_y2": 437.4,
"r_x3": 320.8,
"r_y3": 437.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is implemented with PyTorch and Torchvi-",
"orig": "TableFormer is implemented with PyTorch and Torchvi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 458.2,
"r_x1": 384.6,
"r_y1": 458.2,
"r_x2": 384.6,
"r_y2": 449.3,
"r_x3": 308.9,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "sion libraries [22].",
"orig": "sion libraries [22].",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 458.2,
"r_x1": 545.1,
"r_y1": 458.2,
"r_x2": 545.1,
"r_y2": 449.3,
"r_x3": 391.4,
"r_y3": 449.3,
"coord_origin": "TOPLEFT"
},
"text": "To speed up the inference, the image",
"orig": "To speed up the inference, the image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 470.2,
"r_x1": 494.0,
"r_y1": 470.2,
"r_x2": 494.0,
"r_y2": 461.3,
"r_x3": 308.9,
"r_y3": 461.3,
"coord_origin": "TOPLEFT"
},
"text": "undergoes a single forward pass through the",
"orig": "undergoes a single forward pass through the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.1,
"r_y0": 470.0,
"r_x1": 545.1,
"r_y1": 470.0,
"r_x2": 545.1,
"r_y2": 461.4,
"r_x3": 498.1,
"r_y3": 461.4,
"coord_origin": "TOPLEFT"
},
"text": "CNN Back-",
"orig": "CNN Back-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 481.9,
"r_x1": 364.4,
"r_y1": 481.9,
"r_x2": 364.4,
"r_y2": 473.3,
"r_x3": 308.9,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "bone Network",
"orig": "bone Network",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.1,
"r_y0": 482.1,
"r_x1": 545.1,
"r_y1": 482.1,
"r_x2": 545.1,
"r_y2": 473.2,
"r_x3": 367.1,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "and transformer encoder. This eliminates the",
"orig": "and transformer encoder. This eliminates the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 494.1,
"r_x1": 545.1,
"r_y1": 494.1,
"r_x2": 545.1,
"r_y2": 485.2,
"r_x3": 308.9,
"r_y3": 485.2,
"coord_origin": "TOPLEFT"
},
"text": "overhead of generating the same features for each decoding",
"orig": "overhead of generating the same features for each decoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 506.1,
"r_x1": 545.1,
"r_y1": 506.1,
"r_x2": 545.1,
"r_y2": 497.1,
"r_x3": 308.9,
"r_y3": 497.1,
"coord_origin": "TOPLEFT"
},
"text": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"orig": "step. Similarly, we employ a \u2019caching\u2019 technique to preform",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 518.0,
"r_x1": 545.1,
"r_y1": 518.0,
"r_x2": 545.1,
"r_y2": 509.1,
"r_x3": 308.9,
"r_y3": 509.1,
"coord_origin": "TOPLEFT"
},
"text": "faster autoregressive decoding. This is achieved by storing",
"orig": "faster autoregressive decoding. This is achieved by storing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 530.0,
"r_x1": 545.1,
"r_y1": 530.0,
"r_x2": 545.1,
"r_y2": 521.1,
"r_x3": 308.9,
"r_y3": 521.1,
"coord_origin": "TOPLEFT"
},
"text": "the features of decoded tokens so we can reuse them for",
"orig": "the features of decoded tokens so we can reuse them for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 541.9,
"r_x1": 545.1,
"r_y1": 541.9,
"r_x2": 545.1,
"r_y2": 533.0,
"r_x3": 308.9,
"r_y3": 533.0,
"coord_origin": "TOPLEFT"
},
"text": "each time step. Therefore, we only compute the attention",
"orig": "each time step. Therefore, we only compute the attention",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 553.9,
"r_x1": 377.2,
"r_y1": 553.9,
"r_x2": 377.2,
"r_y2": 545.0,
"r_x3": 308.9,
"r_y3": 545.0,
"coord_origin": "TOPLEFT"
},
"text": "for each new tag.",
"orig": "for each new tag.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."
},
{
"label": "section_header",
"id": 14,
"page_no": 5,
"cluster": {
"id": 14,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 579.6,
"r": 397.4,
"b": 589.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 589.4,
"r_x1": 323.9,
"r_y1": 589.4,
"r_x2": 323.9,
"r_y2": 579.6,
"r_x3": 308.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "5.2.",
"orig": "5.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.9,
"r_y0": 589.4,
"r_x1": 397.4,
"r_y1": 589.4,
"r_x2": 397.4,
"r_y2": 579.6,
"r_x3": 333.9,
"r_y3": 579.6,
"coord_origin": "TOPLEFT"
},
"text": "Generalization",
"orig": "Generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.2. Generalization"
},
{
"label": "text",
"id": 2,
"page_no": 5,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 308.9,
"t": 603.4,
"r": 545.1,
"b": 672.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 612.4,
"r_x1": 545.1,
"r_y1": 612.4,
"r_x2": 545.1,
"r_y2": 603.4,
"r_x3": 320.8,
"r_y3": 603.4,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer is evaluated on three major publicly avail-",
"orig": "TableFormer is evaluated on three major publicly avail-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 624.3,
"r_x1": 545.1,
"r_y1": 624.3,
"r_x2": 545.1,
"r_y2": 615.4,
"r_x3": 308.9,
"r_y3": 615.4,
"coord_origin": "TOPLEFT"
},
"text": "able datasets of different nature to prove the generalization",
"orig": "able datasets of different nature to prove the generalization",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 636.3,
"r_x1": 545.1,
"r_y1": 636.3,
"r_x2": 545.1,
"r_y2": 627.4,
"r_x3": 308.9,
"r_y3": 627.4,
"coord_origin": "TOPLEFT"
},
"text": "and effectiveness of our model. The datasets used for eval-",
"orig": "and effectiveness of our model. The datasets used for eval-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 648.2,
"r_x1": 545.1,
"r_y1": 648.2,
"r_x2": 545.1,
"r_y2": 639.3,
"r_x3": 308.9,
"r_y3": 639.3,
"coord_origin": "TOPLEFT"
},
"text": "uation are the PubTabNet, FinTabNet and TableBank which",
"orig": "uation are the PubTabNet, FinTabNet and TableBank which",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 660.2,
"r_x1": 545.1,
"r_y1": 660.2,
"r_x2": 545.1,
"r_y2": 651.3,
"r_x3": 308.9,
"r_y3": 651.3,
"coord_origin": "TOPLEFT"
},
"text": "stem from the scientific, financial and general domains re-",
"orig": "stem from the scientific, financial and general domains re-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 672.1,
"r_x1": 350.7,
"r_y1": 672.1,
"r_x2": 350.7,
"r_y2": 663.2,
"r_x3": 308.9,
"r_y3": 663.2,
"coord_origin": "TOPLEFT"
},
"text": "spectively.",
"orig": "spectively.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."
},
{
"label": "text",
"id": 8,
"page_no": 5,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 680.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 689.2,
"r_x1": 545.1,
"r_y1": 689.2,
"r_x2": 545.1,
"r_y2": 680.3,
"r_x3": 320.8,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "We also share our baseline results on the challenging",
"orig": "We also share our baseline results on the challenging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 701.2,
"r_x1": 396.2,
"r_y1": 701.2,
"r_x2": 396.2,
"r_y2": 692.3,
"r_x3": 308.9,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet dataset.",
"orig": "SynthTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.4,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 406.4,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Throughout our experiments, the",
"orig": "Throughout our experiments, the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 495.9,
"r_y1": 713.2,
"r_x2": 495.9,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "same parameters stated in Sec. 5.1 are utilized.",
"orig": "same parameters stated in Sec. 5.1 are utilized.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."
}
],
"headers": [
{
"label": "page_footer",
"id": 17,
"page_no": 5,
"cluster": {
"id": 17,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6"
}
]
}
},
{
"page_no": 6,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.3,
"r_x1": 63.7,
"r_y1": 84.3,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.1,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.8,
"r_y0": 84.3,
"r_x1": 167.9,
"r_y1": 84.3,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.8,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 102.3,
"r_x1": 286.4,
"r_y1": 102.3,
"r_x2": 286.4,
"r_y2": 93.4,
"r_x3": 62.1,
"r_y3": 93.4,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 114.2,
"r_x1": 286.4,
"r_y1": 114.2,
"r_x2": 286.4,
"r_y2": 105.3,
"r_x3": 50.1,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 126.2,
"r_x1": 286.4,
"r_y1": 126.2,
"r_x2": 286.4,
"r_y2": 117.3,
"r_x3": 50.1,
"r_y3": 117.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 138.1,
"r_x1": 136.7,
"r_y1": 138.1,
"r_x2": 136.7,
"r_y2": 129.2,
"r_x3": 50.1,
"r_y3": 129.2,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.2,
"r_y0": 165.9,
"r_x1": 118.9,
"r_y1": 165.9,
"r_x2": 118.9,
"r_y2": 157.1,
"r_x3": 86.2,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.9,
"r_y0": 165.9,
"r_x1": 143.3,
"r_y1": 165.9,
"r_x2": 143.3,
"r_y2": 157.1,
"r_x3": 118.9,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.8,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.1,
"r_x3": 143.8,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.1,
"r_y0": 165.9,
"r_x1": 175.9,
"r_y1": 165.9,
"r_x2": 175.9,
"r_y2": 156.5,
"r_x3": 168.1,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.3,
"r_y0": 159.2,
"r_x1": 222.0,
"r_y1": 159.2,
"r_x2": 222.0,
"r_y2": 150.3,
"r_x3": 179.3,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 222.0,
"r_y0": 159.2,
"r_x1": 246.3,
"r_y1": 159.2,
"r_x2": 246.3,
"r_y2": 150.3,
"r_x3": 222.0,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.8,
"r_y0": 159.2,
"r_x1": 250.7,
"r_y1": 159.2,
"r_x2": 250.7,
"r_y2": 150.3,
"r_x3": 246.8,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.2,
"r_y0": 172.7,
"r_x1": 206.3,
"r_y1": 172.7,
"r_x2": 206.3,
"r_y2": 163.9,
"r_x3": 182.2,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 172.7,
"r_x1": 209.1,
"r_y1": 172.7,
"r_x2": 209.1,
"r_y2": 163.3,
"r_x3": 206.3,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.1,
"r_y0": 172.7,
"r_x1": 219.2,
"r_y1": 172.7,
"r_x2": 219.2,
"r_y2": 163.9,
"r_x3": 209.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.7,
"r_x1": 222.5,
"r_y1": 172.7,
"r_x2": 222.5,
"r_y2": 163.3,
"r_x3": 219.7,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.1,
"r_y0": 172.7,
"r_x1": 226.9,
"r_y1": 172.7,
"r_x2": 226.9,
"r_y2": 163.9,
"r_x3": 224.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.6,
"r_y0": 172.7,
"r_x1": 231.3,
"r_y1": 172.7,
"r_x2": 231.3,
"r_y2": 163.3,
"r_x3": 228.6,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.3,
"r_y0": 172.7,
"r_x1": 240.6,
"r_y1": 172.7,
"r_x2": 240.6,
"r_y2": 163.9,
"r_x3": 231.3,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.1,
"r_y0": 172.7,
"r_x1": 243.9,
"r_y1": 172.7,
"r_x2": 243.9,
"r_y2": 163.3,
"r_x3": 241.1,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.9,
"r_y0": 172.7,
"r_x1": 247.8,
"r_y1": 172.7,
"r_x2": 247.8,
"r_y2": 163.9,
"r_x3": 243.9,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 166.1,
"r_x1": 286.4,
"r_y1": 166.1,
"r_x2": 286.4,
"r_y2": 157.2,
"r_x3": 274.7,
"r_y3": 157.2,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 190.1,
"r_x1": 86.4,
"r_y1": 190.1,
"r_x2": 86.4,
"r_y2": 181.2,
"r_x3": 62.1,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.6,
"r_y0": 189.8,
"r_x1": 98.7,
"r_y1": 189.8,
"r_x2": 98.7,
"r_y2": 181.0,
"r_x3": 88.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.1,
"r_x1": 115.8,
"r_y1": 190.1,
"r_x2": 115.8,
"r_y2": 181.2,
"r_x3": 101.4,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.0,
"r_y0": 189.8,
"r_x1": 127.3,
"r_y1": 189.8,
"r_x2": 127.3,
"r_y2": 181.0,
"r_x3": 118.0,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.0,
"r_y0": 190.1,
"r_x1": 286.4,
"r_y1": 190.1,
"r_x2": 286.4,
"r_y2": 181.2,
"r_x3": 130.0,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 202.0,
"r_x1": 252.8,
"r_y1": 202.0,
"r_x2": 252.8,
"r_y2": 193.1,
"r_x3": 50.1,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.2,
"r_y0": 201.8,
"r_x1": 257.9,
"r_y1": 201.8,
"r_x2": 257.9,
"r_y2": 192.4,
"r_x3": 255.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.9,
"r_y0": 201.8,
"r_x1": 263.8,
"r_y1": 201.8,
"r_x2": 263.8,
"r_y2": 193.0,
"r_x3": 257.9,
"r_y3": 193.0,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.2,
"r_y0": 201.8,
"r_x1": 267.9,
"r_y1": 201.8,
"r_x2": 267.9,
"r_y2": 192.4,
"r_x3": 265.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.3,
"r_y0": 202.0,
"r_x1": 286.4,
"r_y1": 202.0,
"r_x2": 286.4,
"r_y2": 193.1,
"r_x3": 270.3,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 214.0,
"r_x1": 172.1,
"r_y1": 214.0,
"r_x2": 172.1,
"r_y2": 205.1,
"r_x3": 50.1,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.6,
"r_y0": 213.8,
"r_x1": 180.4,
"r_y1": 213.8,
"r_x2": 180.4,
"r_y2": 204.9,
"r_x3": 174.6,
"r_y3": 204.9,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.8,
"r_y0": 214.0,
"r_x1": 184.3,
"r_y1": 214.0,
"r_x2": 184.3,
"r_y2": 205.1,
"r_x3": 181.8,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 234.7,
"r_x1": 64.6,
"r_y1": 234.7,
"r_x2": 64.6,
"r_y2": 224.8,
"r_x3": 50.1,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.2,
"r_y0": 234.7,
"r_x1": 170.5,
"r_y1": 234.7,
"r_x2": 170.5,
"r_y2": 224.8,
"r_x3": 74.2,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.6,
"r_x1": 105.3,
"r_y1": 252.6,
"r_x2": 105.3,
"r_y2": 243.6,
"r_x3": 62.1,
"r_y3": 243.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.1,
"r_y0": 252.7,
"r_x1": 184.7,
"r_y1": 252.7,
"r_x2": 184.7,
"r_y2": 243.8,
"r_x3": 112.1,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.5,
"r_y0": 252.7,
"r_x1": 286.4,
"r_y1": 252.7,
"r_x2": 286.4,
"r_y2": 243.8,
"r_x3": 191.5,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.6,
"r_x1": 286.4,
"r_y1": 264.6,
"r_x2": 286.4,
"r_y2": 255.7,
"r_x3": 50.1,
"r_y3": 255.7,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 286.4,
"r_y1": 276.6,
"r_x2": 286.4,
"r_y2": 267.7,
"r_x3": 50.1,
"r_y3": 267.7,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.5,
"r_x1": 286.4,
"r_y1": 288.5,
"r_x2": 286.4,
"r_y2": 279.6,
"r_x3": 50.1,
"r_y3": 279.6,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.5,
"r_x1": 286.4,
"r_y1": 300.5,
"r_x2": 286.4,
"r_y2": 291.6,
"r_x3": 50.1,
"r_y3": 291.6,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.5,
"r_x1": 286.4,
"r_y1": 312.5,
"r_x2": 286.4,
"r_y2": 303.5,
"r_x3": 50.1,
"r_y3": 303.5,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.4,
"r_x1": 286.4,
"r_y1": 324.4,
"r_x2": 286.4,
"r_y2": 315.5,
"r_x3": 50.1,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.4,
"r_x1": 286.4,
"r_y1": 336.4,
"r_x2": 286.4,
"r_y2": 327.5,
"r_x3": 50.1,
"r_y3": 327.5,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.3,
"r_x1": 286.4,
"r_y1": 348.3,
"r_x2": 286.4,
"r_y2": 339.4,
"r_x3": 50.1,
"r_y3": 339.4,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.3,
"r_x1": 286.4,
"r_y1": 360.3,
"r_x2": 286.4,
"r_y2": 351.4,
"r_x3": 50.1,
"r_y3": 351.4,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.2,
"r_x1": 286.4,
"r_y1": 372.2,
"r_x2": 286.4,
"r_y2": 363.3,
"r_x3": 50.1,
"r_y3": 363.3,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.2,
"r_x1": 286.4,
"r_y1": 384.2,
"r_x2": 286.4,
"r_y2": 375.3,
"r_x3": 50.1,
"r_y3": 375.3,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.1,
"r_x1": 170.0,
"r_y1": 396.1,
"r_x2": 170.0,
"r_y2": 387.2,
"r_x3": 50.1,
"r_y3": 387.2,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 601.3,
"r_x1": 286.4,
"r_y1": 601.3,
"r_x2": 286.4,
"r_y2": 592.4,
"r_x3": 50.1,
"r_y3": 592.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 613.3,
"r_x1": 247.5,
"r_y1": 613.3,
"r_x2": 247.5,
"r_y2": 604.4,
"r_x3": 50.1,
"r_y3": 604.4,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 625.2,
"r_x1": 261.8,
"r_y1": 625.2,
"r_x2": 261.8,
"r_y2": 616.3,
"r_x3": 50.1,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 653.3,
"r_x1": 124.7,
"r_y1": 653.3,
"r_x2": 124.7,
"r_y2": 644.3,
"r_x3": 62.1,
"r_y3": 644.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.4,
"r_x1": 242.9,
"r_y1": 653.4,
"r_x2": 242.9,
"r_y2": 644.5,
"r_x3": 128.2,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 653.1,
"r_x1": 286.4,
"r_y1": 653.1,
"r_x2": 286.4,
"r_y2": 644.6,
"r_x3": 245.6,
"r_y3": 644.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.1,
"r_x1": 85.0,
"r_y1": 665.1,
"r_x2": 85.0,
"r_y2": 656.5,
"r_x3": 50.1,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.5,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 89.5,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 322.1,
"r_y1": 84.1,
"r_x2": 322.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.5,
"r_y0": 83.9,
"r_x1": 404.6,
"r_y1": 83.9,
"r_x2": 404.6,
"r_y2": 75.3,
"r_x3": 325.5,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 408.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 470.2,
"r_y1": 108.0,
"r_x2": 470.2,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.5,
"r_y0": 108.0,
"r_x1": 545.1,
"r_y1": 108.0,
"r_x2": 545.1,
"r_y2": 99.1,
"r_x3": 477.5,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 120.0,
"r_x1": 545.1,
"r_y1": 120.0,
"r_x2": 545.1,
"r_y2": 111.1,
"r_x3": 308.9,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 131.9,
"r_x1": 545.1,
"r_y1": 131.9,
"r_x2": 545.1,
"r_y2": 123.0,
"r_x3": 308.9,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 143.9,
"r_x1": 502.0,
"r_y1": 143.9,
"r_x2": 502.0,
"r_y2": 135.0,
"r_x3": 308.9,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.5,
"r_y0": 143.7,
"r_x1": 545.1,
"r_y1": 143.7,
"r_x2": 545.1,
"r_y2": 135.1,
"r_x3": 504.5,
"r_y3": 135.1,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 155.6,
"r_x1": 343.2,
"r_y1": 155.6,
"r_x2": 343.2,
"r_y2": 147.0,
"r_x3": 308.9,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 155.8,
"r_x1": 545.1,
"r_y1": 155.8,
"r_x2": 545.1,
"r_y2": 146.9,
"r_x3": 346.4,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 167.8,
"r_x1": 446.2,
"r_y1": 167.8,
"r_x2": 446.2,
"r_y2": 158.9,
"r_x3": 308.9,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.3,
"r_y0": 167.6,
"r_x1": 525.0,
"r_y1": 167.6,
"r_x2": 525.0,
"r_y2": 159.0,
"r_x3": 448.3,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.1,
"r_y1": 167.8,
"r_x2": 545.1,
"r_y2": 158.9,
"r_x3": 527.4,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 179.8,
"r_x1": 545.1,
"r_y1": 179.8,
"r_x2": 545.1,
"r_y2": 170.8,
"r_x3": 308.9,
"r_y3": 170.8,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 191.7,
"r_x1": 432.9,
"r_y1": 191.7,
"r_x2": 432.9,
"r_y2": 182.8,
"r_x3": 308.9,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.4,
"r_y0": 191.5,
"r_x1": 510.9,
"r_y1": 191.5,
"r_x2": 510.9,
"r_y2": 182.9,
"r_x3": 436.4,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.7,
"r_y0": 191.7,
"r_x1": 545.1,
"r_y1": 191.7,
"r_x2": 545.1,
"r_y2": 182.8,
"r_x3": 514.7,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 203.7,
"r_x1": 431.2,
"r_y1": 203.7,
"r_x2": 431.2,
"r_y2": 194.8,
"r_x3": 308.9,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 203.4,
"r_x1": 514.2,
"r_y1": 203.4,
"r_x2": 514.2,
"r_y2": 194.8,
"r_x3": 434.7,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.2,
"r_y0": 203.7,
"r_x1": 545.1,
"r_y1": 203.7,
"r_x2": 545.1,
"r_y2": 194.8,
"r_x3": 514.2,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 215.4,
"r_x1": 382.4,
"r_y1": 215.4,
"r_x2": 382.4,
"r_y2": 206.8,
"r_x3": 308.9,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 215.6,
"r_x1": 545.1,
"r_y1": 215.6,
"r_x2": 545.1,
"r_y2": 206.7,
"r_x3": 385.1,
"r_y3": 206.7,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 227.6,
"r_x1": 501.7,
"r_y1": 227.6,
"r_x2": 501.7,
"r_y2": 218.7,
"r_x3": 308.9,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 325.4,
"r_x1": 341.5,
"r_y1": 325.4,
"r_x2": 341.5,
"r_y2": 316.4,
"r_x3": 308.9,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.4,
"r_x1": 545.1,
"r_y1": 325.4,
"r_x2": 545.1,
"r_y2": 316.4,
"r_x3": 348.6,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.3,
"r_x1": 475.0,
"r_y1": 337.3,
"r_x2": 475.0,
"r_y2": 328.4,
"r_x3": 308.9,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 376.6,
"r_x1": 378.9,
"r_y1": 376.6,
"r_x2": 378.9,
"r_y2": 367.7,
"r_x3": 320.8,
"r_y3": 367.7,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.1,
"r_y0": 376.7,
"r_x1": 545.1,
"r_y1": 376.7,
"r_x2": 545.1,
"r_y2": 367.8,
"r_x3": 387.1,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.7,
"r_x1": 487.2,
"r_y1": 388.7,
"r_x2": 487.2,
"r_y2": 379.8,
"r_x3": 308.9,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.0,
"r_y0": 388.7,
"r_x1": 545.1,
"r_y1": 388.7,
"r_x2": 545.1,
"r_y2": 379.8,
"r_x3": 494.0,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.6,
"r_x1": 545.1,
"r_y1": 400.6,
"r_x2": 545.1,
"r_y2": 391.7,
"r_x3": 308.9,
"r_y3": 391.7,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.6,
"r_x1": 545.1,
"r_y1": 412.6,
"r_x2": 545.1,
"r_y2": 403.7,
"r_x3": 308.9,
"r_y3": 403.7,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.5,
"r_x1": 314.1,
"r_y1": 424.5,
"r_x2": 314.1,
"r_y2": 415.6,
"r_x3": 308.9,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 424.5,
"r_x1": 545.1,
"r_y1": 424.5,
"r_x2": 545.1,
"r_y2": 415.6,
"r_x3": 316.7,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.5,
"r_x1": 545.1,
"r_y1": 436.5,
"r_x2": 545.1,
"r_y2": 427.6,
"r_x3": 308.9,
"r_y3": 427.6,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.4,
"r_x1": 545.1,
"r_y1": 448.4,
"r_x2": 545.1,
"r_y2": 439.5,
"r_x3": 308.9,
"r_y3": 439.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.4,
"r_x1": 350.2,
"r_y1": 460.4,
"r_x2": 350.2,
"r_y2": 451.5,
"r_x3": 308.9,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.2,
"r_y0": 460.3,
"r_x1": 374.6,
"r_y1": 460.3,
"r_x2": 374.6,
"r_y2": 451.4,
"r_x3": 352.2,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.5,
"r_y0": 460.4,
"r_x1": 545.1,
"r_y1": 460.4,
"r_x2": 545.1,
"r_y2": 451.5,
"r_x3": 376.5,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 308.9,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.4,
"r_x3": 308.9,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.3,
"r_x1": 545.1,
"r_y1": 496.3,
"r_x2": 545.1,
"r_y2": 487.4,
"r_x3": 308.9,
"r_y3": 487.4,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.2,
"r_x1": 405.7,
"r_y1": 520.2,
"r_x2": 405.7,
"r_y2": 511.3,
"r_x3": 308.9,
"r_y3": 511.3,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.8,
"r_x1": 341.7,
"r_y1": 665.8,
"r_x2": 341.7,
"r_y2": 656.9,
"r_x3": 308.9,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.6,
"r_y0": 665.8,
"r_x1": 545.1,
"r_y1": 665.8,
"r_x2": 545.1,
"r_y2": 656.9,
"r_x3": 349.6,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.7,
"r_x1": 545.1,
"r_y1": 677.7,
"r_x2": 545.1,
"r_y2": 668.8,
"r_x3": 308.9,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.7,
"r_x1": 435.0,
"r_y1": 689.7,
"r_x2": 435.0,
"r_y2": 680.8,
"r_x3": 308.9,
"r_y3": 680.8,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 74.4,
"r": 167.9,
"b": 84.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.3,
"r_x1": 63.7,
"r_y1": 84.3,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.1,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.8,
"r_y0": 84.3,
"r_x1": 167.9,
"r_y1": 84.3,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.8,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 93.4,
"r": 286.4,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 102.3,
"r_x1": 286.4,
"r_y1": 102.3,
"r_x2": 286.4,
"r_y2": 93.4,
"r_x3": 62.1,
"r_y3": 93.4,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 114.2,
"r_x1": 286.4,
"r_y1": 114.2,
"r_x2": 286.4,
"r_y2": 105.3,
"r_x3": 50.1,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 126.2,
"r_x1": 286.4,
"r_y1": 126.2,
"r_x2": 286.4,
"r_y2": 117.3,
"r_x3": 50.1,
"r_y3": 117.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 138.1,
"r_x1": 136.7,
"r_y1": 138.1,
"r_x2": 136.7,
"r_y2": 129.2,
"r_x3": 50.1,
"r_y3": 129.2,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "formula",
"bbox": {
"l": 86.2,
"t": 150.3,
"r": 286.4,
"b": 172.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.2,
"r_y0": 165.9,
"r_x1": 118.9,
"r_y1": 165.9,
"r_x2": 118.9,
"r_y2": 157.1,
"r_x3": 86.2,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.9,
"r_y0": 165.9,
"r_x1": 143.3,
"r_y1": 165.9,
"r_x2": 143.3,
"r_y2": 157.1,
"r_x3": 118.9,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.8,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.1,
"r_x3": 143.8,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.1,
"r_y0": 165.9,
"r_x1": 175.9,
"r_y1": 165.9,
"r_x2": 175.9,
"r_y2": 156.5,
"r_x3": 168.1,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.3,
"r_y0": 159.2,
"r_x1": 222.0,
"r_y1": 159.2,
"r_x2": 222.0,
"r_y2": 150.3,
"r_x3": 179.3,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 222.0,
"r_y0": 159.2,
"r_x1": 246.3,
"r_y1": 159.2,
"r_x2": 246.3,
"r_y2": 150.3,
"r_x3": 222.0,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.8,
"r_y0": 159.2,
"r_x1": 250.7,
"r_y1": 159.2,
"r_x2": 250.7,
"r_y2": 150.3,
"r_x3": 246.8,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.2,
"r_y0": 172.7,
"r_x1": 206.3,
"r_y1": 172.7,
"r_x2": 206.3,
"r_y2": 163.9,
"r_x3": 182.2,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 172.7,
"r_x1": 209.1,
"r_y1": 172.7,
"r_x2": 209.1,
"r_y2": 163.3,
"r_x3": 206.3,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.1,
"r_y0": 172.7,
"r_x1": 219.2,
"r_y1": 172.7,
"r_x2": 219.2,
"r_y2": 163.9,
"r_x3": 209.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.7,
"r_x1": 222.5,
"r_y1": 172.7,
"r_x2": 222.5,
"r_y2": 163.3,
"r_x3": 219.7,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.1,
"r_y0": 172.7,
"r_x1": 226.9,
"r_y1": 172.7,
"r_x2": 226.9,
"r_y2": 163.9,
"r_x3": 224.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.6,
"r_y0": 172.7,
"r_x1": 231.3,
"r_y1": 172.7,
"r_x2": 231.3,
"r_y2": 163.3,
"r_x3": 228.6,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.3,
"r_y0": 172.7,
"r_x1": 240.6,
"r_y1": 172.7,
"r_x2": 240.6,
"r_y2": 163.9,
"r_x3": 231.3,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.1,
"r_y0": 172.7,
"r_x1": 243.9,
"r_y1": 172.7,
"r_x2": 243.9,
"r_y2": 163.3,
"r_x3": 241.1,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.9,
"r_y0": 172.7,
"r_x1": 247.8,
"r_y1": 172.7,
"r_x2": 247.8,
"r_y2": 163.9,
"r_x3": 243.9,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 166.1,
"r_x1": 286.4,
"r_y1": 166.1,
"r_x2": 286.4,
"r_y2": 157.2,
"r_x3": 274.7,
"r_y3": 157.2,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 286.4,
"b": 214.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 190.1,
"r_x1": 86.4,
"r_y1": 190.1,
"r_x2": 86.4,
"r_y2": 181.2,
"r_x3": 62.1,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.6,
"r_y0": 189.8,
"r_x1": 98.7,
"r_y1": 189.8,
"r_x2": 98.7,
"r_y2": 181.0,
"r_x3": 88.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.1,
"r_x1": 115.8,
"r_y1": 190.1,
"r_x2": 115.8,
"r_y2": 181.2,
"r_x3": 101.4,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.0,
"r_y0": 189.8,
"r_x1": 127.3,
"r_y1": 189.8,
"r_x2": 127.3,
"r_y2": 181.0,
"r_x3": 118.0,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.0,
"r_y0": 190.1,
"r_x1": 286.4,
"r_y1": 190.1,
"r_x2": 286.4,
"r_y2": 181.2,
"r_x3": 130.0,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 202.0,
"r_x1": 252.8,
"r_y1": 202.0,
"r_x2": 252.8,
"r_y2": 193.1,
"r_x3": 50.1,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.2,
"r_y0": 201.8,
"r_x1": 257.9,
"r_y1": 201.8,
"r_x2": 257.9,
"r_y2": 192.4,
"r_x3": 255.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.9,
"r_y0": 201.8,
"r_x1": 263.8,
"r_y1": 201.8,
"r_x2": 263.8,
"r_y2": 193.0,
"r_x3": 257.9,
"r_y3": 193.0,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.2,
"r_y0": 201.8,
"r_x1": 267.9,
"r_y1": 201.8,
"r_x2": 267.9,
"r_y2": 192.4,
"r_x3": 265.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.3,
"r_y0": 202.0,
"r_x1": 286.4,
"r_y1": 202.0,
"r_x2": 286.4,
"r_y2": 193.1,
"r_x3": 270.3,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 214.0,
"r_x1": 172.1,
"r_y1": 214.0,
"r_x2": 172.1,
"r_y2": 205.1,
"r_x3": 50.1,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.6,
"r_y0": 213.8,
"r_x1": 180.4,
"r_y1": 213.8,
"r_x2": 180.4,
"r_y2": 204.9,
"r_x3": 174.6,
"r_y3": 204.9,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.8,
"r_y0": 214.0,
"r_x1": 184.3,
"r_y1": 214.0,
"r_x2": 184.3,
"r_y2": 205.1,
"r_x3": 181.8,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 224.8,
"r": 170.5,
"b": 234.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 234.7,
"r_x1": 64.6,
"r_y1": 234.7,
"r_x2": 64.6,
"r_y2": 224.8,
"r_x3": 50.1,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.2,
"r_y0": 234.7,
"r_x1": 170.5,
"r_y1": 234.7,
"r_x2": 170.5,
"r_y2": 224.8,
"r_x3": 74.2,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.6,
"r": 286.4,
"b": 396.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.6,
"r_x1": 105.3,
"r_y1": 252.6,
"r_x2": 105.3,
"r_y2": 243.6,
"r_x3": 62.1,
"r_y3": 243.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.1,
"r_y0": 252.7,
"r_x1": 184.7,
"r_y1": 252.7,
"r_x2": 184.7,
"r_y2": 243.8,
"r_x3": 112.1,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.5,
"r_y0": 252.7,
"r_x1": 286.4,
"r_y1": 252.7,
"r_x2": 286.4,
"r_y2": 243.8,
"r_x3": 191.5,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.6,
"r_x1": 286.4,
"r_y1": 264.6,
"r_x2": 286.4,
"r_y2": 255.7,
"r_x3": 50.1,
"r_y3": 255.7,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 286.4,
"r_y1": 276.6,
"r_x2": 286.4,
"r_y2": 267.7,
"r_x3": 50.1,
"r_y3": 267.7,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.5,
"r_x1": 286.4,
"r_y1": 288.5,
"r_x2": 286.4,
"r_y2": 279.6,
"r_x3": 50.1,
"r_y3": 279.6,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.5,
"r_x1": 286.4,
"r_y1": 300.5,
"r_x2": 286.4,
"r_y2": 291.6,
"r_x3": 50.1,
"r_y3": 291.6,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.5,
"r_x1": 286.4,
"r_y1": 312.5,
"r_x2": 286.4,
"r_y2": 303.5,
"r_x3": 50.1,
"r_y3": 303.5,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.4,
"r_x1": 286.4,
"r_y1": 324.4,
"r_x2": 286.4,
"r_y2": 315.5,
"r_x3": 50.1,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.4,
"r_x1": 286.4,
"r_y1": 336.4,
"r_x2": 286.4,
"r_y2": 327.5,
"r_x3": 50.1,
"r_y3": 327.5,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.3,
"r_x1": 286.4,
"r_y1": 348.3,
"r_x2": 286.4,
"r_y2": 339.4,
"r_x3": 50.1,
"r_y3": 339.4,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.3,
"r_x1": 286.4,
"r_y1": 360.3,
"r_x2": 286.4,
"r_y2": 351.4,
"r_x3": 50.1,
"r_y3": 351.4,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.2,
"r_x1": 286.4,
"r_y1": 372.2,
"r_x2": 286.4,
"r_y2": 363.3,
"r_x3": 50.1,
"r_y3": 363.3,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.2,
"r_x1": 286.4,
"r_y1": 384.2,
"r_x2": 286.4,
"r_y2": 375.3,
"r_x3": 50.1,
"r_y3": 375.3,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.1,
"r_x1": 170.0,
"r_y1": 396.1,
"r_x2": 170.0,
"r_y2": 387.2,
"r_x3": 50.1,
"r_y3": 387.2,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "table",
"bbox": {
"l": 53.4,
"t": 409.1,
"r": 283.0,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.4,
"t": 426.7,
"r": 247.7,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 15,
"label": "text",
"bbox": {
"l": 50.1,
"t": 592.4,
"r": 286.4,
"b": 613.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.72,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 601.3,
"r_x1": 286.4,
"r_y1": 601.3,
"r_x2": 286.4,
"r_y2": 592.4,
"r_x3": 50.1,
"r_y3": 592.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 613.3,
"r_x1": 247.5,
"r_y1": 613.3,
"r_x2": 247.5,
"r_y2": 604.4,
"r_x3": 50.1,
"r_y3": 604.4,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 616.3,
"r": 261.8,
"b": 625.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.64,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 625.2,
"r_x1": 261.8,
"r_y1": 625.2,
"r_x2": 261.8,
"r_y2": 616.3,
"r_x3": 50.1,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 644.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 653.3,
"r_x1": 124.7,
"r_y1": 653.3,
"r_x2": 124.7,
"r_y2": 644.3,
"r_x3": 62.1,
"r_y3": 644.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.4,
"r_x1": 242.9,
"r_y1": 653.4,
"r_x2": 242.9,
"r_y2": 644.5,
"r_x3": 128.2,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 653.1,
"r_x1": 286.4,
"r_y1": 653.1,
"r_x2": 286.4,
"r_y2": 644.6,
"r_x3": 245.6,
"r_y3": 644.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.1,
"r_x1": 85.0,
"r_y1": 665.1,
"r_x2": 85.0,
"r_y2": 656.5,
"r_x3": 50.1,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.5,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 89.5,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 227.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 322.1,
"r_y1": 84.1,
"r_x2": 322.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.5,
"r_y0": 83.9,
"r_x1": 404.6,
"r_y1": 83.9,
"r_x2": 404.6,
"r_y2": 75.3,
"r_x3": 325.5,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 408.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 470.2,
"r_y1": 108.0,
"r_x2": 470.2,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.5,
"r_y0": 108.0,
"r_x1": 545.1,
"r_y1": 108.0,
"r_x2": 545.1,
"r_y2": 99.1,
"r_x3": 477.5,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 120.0,
"r_x1": 545.1,
"r_y1": 120.0,
"r_x2": 545.1,
"r_y2": 111.1,
"r_x3": 308.9,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 131.9,
"r_x1": 545.1,
"r_y1": 131.9,
"r_x2": 545.1,
"r_y2": 123.0,
"r_x3": 308.9,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 143.9,
"r_x1": 502.0,
"r_y1": 143.9,
"r_x2": 502.0,
"r_y2": 135.0,
"r_x3": 308.9,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.5,
"r_y0": 143.7,
"r_x1": 545.1,
"r_y1": 143.7,
"r_x2": 545.1,
"r_y2": 135.1,
"r_x3": 504.5,
"r_y3": 135.1,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 155.6,
"r_x1": 343.2,
"r_y1": 155.6,
"r_x2": 343.2,
"r_y2": 147.0,
"r_x3": 308.9,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 155.8,
"r_x1": 545.1,
"r_y1": 155.8,
"r_x2": 545.1,
"r_y2": 146.9,
"r_x3": 346.4,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 167.8,
"r_x1": 446.2,
"r_y1": 167.8,
"r_x2": 446.2,
"r_y2": 158.9,
"r_x3": 308.9,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.3,
"r_y0": 167.6,
"r_x1": 525.0,
"r_y1": 167.6,
"r_x2": 525.0,
"r_y2": 159.0,
"r_x3": 448.3,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.1,
"r_y1": 167.8,
"r_x2": 545.1,
"r_y2": 158.9,
"r_x3": 527.4,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 179.8,
"r_x1": 545.1,
"r_y1": 179.8,
"r_x2": 545.1,
"r_y2": 170.8,
"r_x3": 308.9,
"r_y3": 170.8,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 191.7,
"r_x1": 432.9,
"r_y1": 191.7,
"r_x2": 432.9,
"r_y2": 182.8,
"r_x3": 308.9,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.4,
"r_y0": 191.5,
"r_x1": 510.9,
"r_y1": 191.5,
"r_x2": 510.9,
"r_y2": 182.9,
"r_x3": 436.4,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.7,
"r_y0": 191.7,
"r_x1": 545.1,
"r_y1": 191.7,
"r_x2": 545.1,
"r_y2": 182.8,
"r_x3": 514.7,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 203.7,
"r_x1": 431.2,
"r_y1": 203.7,
"r_x2": 431.2,
"r_y2": 194.8,
"r_x3": 308.9,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 203.4,
"r_x1": 514.2,
"r_y1": 203.4,
"r_x2": 514.2,
"r_y2": 194.8,
"r_x3": 434.7,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.2,
"r_y0": 203.7,
"r_x1": 545.1,
"r_y1": 203.7,
"r_x2": 545.1,
"r_y2": 194.8,
"r_x3": 514.2,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 215.4,
"r_x1": 382.4,
"r_y1": 215.4,
"r_x2": 382.4,
"r_y2": 206.8,
"r_x3": 308.9,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 215.6,
"r_x1": 545.1,
"r_y1": 215.6,
"r_x2": 545.1,
"r_y2": 206.7,
"r_x3": 385.1,
"r_y3": 206.7,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 227.6,
"r_x1": 501.7,
"r_y1": 227.6,
"r_x2": 501.7,
"r_y2": 218.7,
"r_x3": 308.9,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 308.4,
"t": 247.9,
"r": 533.6,
"b": 303.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 12,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 316.4,
"r": 545.1,
"b": 337.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 325.4,
"r_x1": 341.5,
"r_y1": 325.4,
"r_x2": 341.5,
"r_y2": 316.4,
"r_x3": 308.9,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.4,
"r_x1": 545.1,
"r_y1": 325.4,
"r_x2": 545.1,
"r_y2": 316.4,
"r_x3": 348.6,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.3,
"r_x1": 475.0,
"r_y1": 337.3,
"r_x2": 475.0,
"r_y2": 328.4,
"r_x3": 308.9,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 367.7,
"r": 545.1,
"b": 520.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 376.6,
"r_x1": 378.9,
"r_y1": 376.6,
"r_x2": 378.9,
"r_y2": 367.7,
"r_x3": 320.8,
"r_y3": 367.7,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.1,
"r_y0": 376.7,
"r_x1": 545.1,
"r_y1": 376.7,
"r_x2": 545.1,
"r_y2": 367.8,
"r_x3": 387.1,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.7,
"r_x1": 487.2,
"r_y1": 388.7,
"r_x2": 487.2,
"r_y2": 379.8,
"r_x3": 308.9,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.0,
"r_y0": 388.7,
"r_x1": 545.1,
"r_y1": 388.7,
"r_x2": 545.1,
"r_y2": 379.8,
"r_x3": 494.0,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.6,
"r_x1": 545.1,
"r_y1": 400.6,
"r_x2": 545.1,
"r_y2": 391.7,
"r_x3": 308.9,
"r_y3": 391.7,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.6,
"r_x1": 545.1,
"r_y1": 412.6,
"r_x2": 545.1,
"r_y2": 403.7,
"r_x3": 308.9,
"r_y3": 403.7,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.5,
"r_x1": 314.1,
"r_y1": 424.5,
"r_x2": 314.1,
"r_y2": 415.6,
"r_x3": 308.9,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 424.5,
"r_x1": 545.1,
"r_y1": 424.5,
"r_x2": 545.1,
"r_y2": 415.6,
"r_x3": 316.7,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.5,
"r_x1": 545.1,
"r_y1": 436.5,
"r_x2": 545.1,
"r_y2": 427.6,
"r_x3": 308.9,
"r_y3": 427.6,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.4,
"r_x1": 545.1,
"r_y1": 448.4,
"r_x2": 545.1,
"r_y2": 439.5,
"r_x3": 308.9,
"r_y3": 439.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.4,
"r_x1": 350.2,
"r_y1": 460.4,
"r_x2": 350.2,
"r_y2": 451.5,
"r_x3": 308.9,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.2,
"r_y0": 460.3,
"r_x1": 374.6,
"r_y1": 460.3,
"r_x2": 374.6,
"r_y2": 451.4,
"r_x3": 352.2,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.5,
"r_y0": 460.4,
"r_x1": 545.1,
"r_y1": 460.4,
"r_x2": 545.1,
"r_y2": 451.5,
"r_x3": 376.5,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 308.9,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.4,
"r_x3": 308.9,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.3,
"r_x1": 545.1,
"r_y1": 496.3,
"r_x2": 545.1,
"r_y2": 487.4,
"r_x3": 308.9,
"r_y3": 487.4,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.2,
"r_x1": 405.7,
"r_y1": 520.2,
"r_x2": 405.7,
"r_y2": 511.3,
"r_x3": 308.9,
"r_y3": 511.3,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "table",
"bbox": {
"l": 333.0,
"t": 540.3,
"r": 520.9,
"b": 643.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.2,
"r": 485.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 656.9,
"r": 545.1,
"b": 689.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.8,
"r_x1": 341.7,
"r_y1": 665.8,
"r_x2": 341.7,
"r_y2": 656.9,
"r_x3": 308.9,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.6,
"r_y0": 665.8,
"r_x1": 545.1,
"r_y1": 665.8,
"r_x2": 545.1,
"r_y2": 656.9,
"r_x3": 349.6,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.7,
"r_x1": 545.1,
"r_y1": 677.7,
"r_x2": 545.1,
"r_y2": 668.8,
"r_x3": 308.9,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.7,
"r_x1": 435.0,
"r_y1": 689.7,
"r_x2": 435.0,
"r_y2": 680.8,
"r_x3": 308.9,
"r_y3": 680.8,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"0": {
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.4,
"t": 409.1,
"r": 283.0,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.4,
"t": 426.7,
"r": 247.7,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"8": {
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.4,
"t": 247.9,
"r": 533.6,
"b": 303.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"5": {
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 333.0,
"t": 540.3,
"r": 520.9,
"b": 643.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.2,
"r": 485.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 10,
"page_no": 6,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 74.4,
"r": 167.9,
"b": 84.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.3,
"r_x1": 63.7,
"r_y1": 84.3,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.1,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.8,
"r_y0": 84.3,
"r_x1": 167.9,
"r_y1": 84.3,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.8,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.3. Datasets and Metrics"
},
{
"label": "text",
"id": 1,
"page_no": 6,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 93.4,
"r": 286.4,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 102.3,
"r_x1": 286.4,
"r_y1": 102.3,
"r_x2": 286.4,
"r_y2": 93.4,
"r_x3": 62.1,
"r_y3": 93.4,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 114.2,
"r_x1": 286.4,
"r_y1": 114.2,
"r_x2": 286.4,
"r_y2": 105.3,
"r_x3": 50.1,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 126.2,
"r_x1": 286.4,
"r_y1": 126.2,
"r_x2": 286.4,
"r_y2": 117.3,
"r_x3": 50.1,
"r_y3": 117.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 138.1,
"r_x1": 136.7,
"r_y1": 138.1,
"r_x2": 136.7,
"r_y2": 129.2,
"r_x3": 50.1,
"r_y3": 129.2,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"
},
{
"label": "formula",
"id": 13,
"page_no": 6,
"cluster": {
"id": 13,
"label": "formula",
"bbox": {
"l": 86.2,
"t": 150.3,
"r": 286.4,
"b": 172.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.2,
"r_y0": 165.9,
"r_x1": 118.9,
"r_y1": 165.9,
"r_x2": 118.9,
"r_y2": 157.1,
"r_x3": 86.2,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.9,
"r_y0": 165.9,
"r_x1": 143.3,
"r_y1": 165.9,
"r_x2": 143.3,
"r_y2": 157.1,
"r_x3": 118.9,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.8,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.1,
"r_x3": 143.8,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.1,
"r_y0": 165.9,
"r_x1": 175.9,
"r_y1": 165.9,
"r_x2": 175.9,
"r_y2": 156.5,
"r_x3": 168.1,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.3,
"r_y0": 159.2,
"r_x1": 222.0,
"r_y1": 159.2,
"r_x2": 222.0,
"r_y2": 150.3,
"r_x3": 179.3,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 222.0,
"r_y0": 159.2,
"r_x1": 246.3,
"r_y1": 159.2,
"r_x2": 246.3,
"r_y2": 150.3,
"r_x3": 222.0,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.8,
"r_y0": 159.2,
"r_x1": 250.7,
"r_y1": 159.2,
"r_x2": 250.7,
"r_y2": 150.3,
"r_x3": 246.8,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.2,
"r_y0": 172.7,
"r_x1": 206.3,
"r_y1": 172.7,
"r_x2": 206.3,
"r_y2": 163.9,
"r_x3": 182.2,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 172.7,
"r_x1": 209.1,
"r_y1": 172.7,
"r_x2": 209.1,
"r_y2": 163.3,
"r_x3": 206.3,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.1,
"r_y0": 172.7,
"r_x1": 219.2,
"r_y1": 172.7,
"r_x2": 219.2,
"r_y2": 163.9,
"r_x3": 209.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.7,
"r_x1": 222.5,
"r_y1": 172.7,
"r_x2": 222.5,
"r_y2": 163.3,
"r_x3": 219.7,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.1,
"r_y0": 172.7,
"r_x1": 226.9,
"r_y1": 172.7,
"r_x2": 226.9,
"r_y2": 163.9,
"r_x3": 224.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.6,
"r_y0": 172.7,
"r_x1": 231.3,
"r_y1": 172.7,
"r_x2": 231.3,
"r_y2": 163.3,
"r_x3": 228.6,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.3,
"r_y0": 172.7,
"r_x1": 240.6,
"r_y1": 172.7,
"r_x2": 240.6,
"r_y2": 163.9,
"r_x3": 231.3,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.1,
"r_y0": 172.7,
"r_x1": 243.9,
"r_y1": 172.7,
"r_x2": 243.9,
"r_y2": 163.3,
"r_x3": 241.1,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.9,
"r_y0": 172.7,
"r_x1": 247.8,
"r_y1": 172.7,
"r_x2": 247.8,
"r_y2": 163.9,
"r_x3": 243.9,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 166.1,
"r_x1": 286.4,
"r_y1": 166.1,
"r_x2": 286.4,
"r_y2": 157.2,
"r_x3": 274.7,
"r_y3": 157.2,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)"
},
{
"label": "text",
"id": 6,
"page_no": 6,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 286.4,
"b": 214.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 190.1,
"r_x1": 86.4,
"r_y1": 190.1,
"r_x2": 86.4,
"r_y2": 181.2,
"r_x3": 62.1,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.6,
"r_y0": 189.8,
"r_x1": 98.7,
"r_y1": 189.8,
"r_x2": 98.7,
"r_y2": 181.0,
"r_x3": 88.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.1,
"r_x1": 115.8,
"r_y1": 190.1,
"r_x2": 115.8,
"r_y2": 181.2,
"r_x3": 101.4,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.0,
"r_y0": 189.8,
"r_x1": 127.3,
"r_y1": 189.8,
"r_x2": 127.3,
"r_y2": 181.0,
"r_x3": 118.0,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.0,
"r_y0": 190.1,
"r_x1": 286.4,
"r_y1": 190.1,
"r_x2": 286.4,
"r_y2": 181.2,
"r_x3": 130.0,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 202.0,
"r_x1": 252.8,
"r_y1": 202.0,
"r_x2": 252.8,
"r_y2": 193.1,
"r_x3": 50.1,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.2,
"r_y0": 201.8,
"r_x1": 257.9,
"r_y1": 201.8,
"r_x2": 257.9,
"r_y2": 192.4,
"r_x3": 255.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.9,
"r_y0": 201.8,
"r_x1": 263.8,
"r_y1": 201.8,
"r_x2": 263.8,
"r_y2": 193.0,
"r_x3": 257.9,
"r_y3": 193.0,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.2,
"r_y0": 201.8,
"r_x1": 267.9,
"r_y1": 201.8,
"r_x2": 267.9,
"r_y2": 192.4,
"r_x3": 265.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.3,
"r_y0": 202.0,
"r_x1": 286.4,
"r_y1": 202.0,
"r_x2": 286.4,
"r_y2": 193.1,
"r_x3": 270.3,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 214.0,
"r_x1": 172.1,
"r_y1": 214.0,
"r_x2": 172.1,
"r_y2": 205.1,
"r_x3": 50.1,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.6,
"r_y0": 213.8,
"r_x1": 180.4,
"r_y1": 213.8,
"r_x2": 180.4,
"r_y2": 204.9,
"r_x3": 174.6,
"r_y3": 204.9,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.8,
"r_y0": 214.0,
"r_x1": 184.3,
"r_y1": 214.0,
"r_x2": 184.3,
"r_y2": 205.1,
"r_x3": 181.8,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."
},
{
"label": "section_header",
"id": 9,
"page_no": 6,
"cluster": {
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 224.8,
"r": 170.5,
"b": 234.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 234.7,
"r_x1": 64.6,
"r_y1": 234.7,
"r_x2": 64.6,
"r_y2": 224.8,
"r_x3": 50.1,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.2,
"r_y0": 234.7,
"r_x1": 170.5,
"r_y1": 234.7,
"r_x2": 170.5,
"r_y2": 224.8,
"r_x3": 74.2,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.4. Quantitative Analysis"
},
{
"label": "text",
"id": 2,
"page_no": 6,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.6,
"r": 286.4,
"b": 396.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.6,
"r_x1": 105.3,
"r_y1": 252.6,
"r_x2": 105.3,
"r_y2": 243.6,
"r_x3": 62.1,
"r_y3": 243.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.1,
"r_y0": 252.7,
"r_x1": 184.7,
"r_y1": 252.7,
"r_x2": 184.7,
"r_y2": 243.8,
"r_x3": 112.1,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.5,
"r_y0": 252.7,
"r_x1": 286.4,
"r_y1": 252.7,
"r_x2": 286.4,
"r_y2": 243.8,
"r_x3": 191.5,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.6,
"r_x1": 286.4,
"r_y1": 264.6,
"r_x2": 286.4,
"r_y2": 255.7,
"r_x3": 50.1,
"r_y3": 255.7,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 286.4,
"r_y1": 276.6,
"r_x2": 286.4,
"r_y2": 267.7,
"r_x3": 50.1,
"r_y3": 267.7,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.5,
"r_x1": 286.4,
"r_y1": 288.5,
"r_x2": 286.4,
"r_y2": 279.6,
"r_x3": 50.1,
"r_y3": 279.6,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.5,
"r_x1": 286.4,
"r_y1": 300.5,
"r_x2": 286.4,
"r_y2": 291.6,
"r_x3": 50.1,
"r_y3": 291.6,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.5,
"r_x1": 286.4,
"r_y1": 312.5,
"r_x2": 286.4,
"r_y2": 303.5,
"r_x3": 50.1,
"r_y3": 303.5,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.4,
"r_x1": 286.4,
"r_y1": 324.4,
"r_x2": 286.4,
"r_y2": 315.5,
"r_x3": 50.1,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.4,
"r_x1": 286.4,
"r_y1": 336.4,
"r_x2": 286.4,
"r_y2": 327.5,
"r_x3": 50.1,
"r_y3": 327.5,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.3,
"r_x1": 286.4,
"r_y1": 348.3,
"r_x2": 286.4,
"r_y2": 339.4,
"r_x3": 50.1,
"r_y3": 339.4,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.3,
"r_x1": 286.4,
"r_y1": 360.3,
"r_x2": 286.4,
"r_y2": 351.4,
"r_x3": 50.1,
"r_y3": 351.4,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.2,
"r_x1": 286.4,
"r_y1": 372.2,
"r_x2": 286.4,
"r_y2": 363.3,
"r_x3": 50.1,
"r_y3": 363.3,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.2,
"r_x1": 286.4,
"r_y1": 384.2,
"r_x2": 286.4,
"r_y2": 375.3,
"r_x3": 50.1,
"r_y3": 375.3,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.1,
"r_x1": 170.0,
"r_y1": 396.1,
"r_x2": 170.0,
"r_y2": 387.2,
"r_x3": 50.1,
"r_y3": 387.2,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."
},
{
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.4,
"t": 409.1,
"r": 283.0,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.4,
"t": 426.7,
"r": 247.7,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "text",
"id": 15,
"page_no": 6,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 50.1,
"t": 592.4,
"r": 286.4,
"b": 613.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.72,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 601.3,
"r_x1": 286.4,
"r_y1": 601.3,
"r_x2": 286.4,
"r_y2": 592.4,
"r_x3": 50.1,
"r_y3": 592.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 613.3,
"r_x1": 247.5,
"r_y1": 613.3,
"r_x2": 247.5,
"r_y2": 604.4,
"r_x3": 50.1,
"r_y3": 604.4,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."
},
{
"label": "text",
"id": 16,
"page_no": 6,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 616.3,
"r": 261.8,
"b": 625.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.64,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 625.2,
"r_x1": 261.8,
"r_y1": 625.2,
"r_x2": 261.8,
"r_y2": 616.3,
"r_x3": 50.1,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "FT: Model was trained on PubTabNet then finetuned."
},
{
"label": "text",
"id": 3,
"page_no": 6,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 644.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 653.3,
"r_x1": 124.7,
"r_y1": 653.3,
"r_x2": 124.7,
"r_y2": 644.3,
"r_x3": 62.1,
"r_y3": 644.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.4,
"r_x1": 242.9,
"r_y1": 653.4,
"r_x2": 242.9,
"r_y2": 644.5,
"r_x3": 128.2,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 653.1,
"r_x1": 286.4,
"r_y1": 653.1,
"r_x2": 286.4,
"r_y2": 644.6,
"r_x3": 245.6,
"r_y3": 644.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.1,
"r_x1": 85.0,
"r_y1": 665.1,
"r_x2": 85.0,
"r_y2": 656.5,
"r_x3": 50.1,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.5,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 89.5,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"
},
{
"label": "text",
"id": 7,
"page_no": 6,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 227.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 322.1,
"r_y1": 84.1,
"r_x2": 322.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.5,
"r_y0": 83.9,
"r_x1": 404.6,
"r_y1": 83.9,
"r_x2": 404.6,
"r_y2": 75.3,
"r_x3": 325.5,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 408.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 470.2,
"r_y1": 108.0,
"r_x2": 470.2,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.5,
"r_y0": 108.0,
"r_x1": 545.1,
"r_y1": 108.0,
"r_x2": 545.1,
"r_y2": 99.1,
"r_x3": 477.5,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 120.0,
"r_x1": 545.1,
"r_y1": 120.0,
"r_x2": 545.1,
"r_y2": 111.1,
"r_x3": 308.9,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 131.9,
"r_x1": 545.1,
"r_y1": 131.9,
"r_x2": 545.1,
"r_y2": 123.0,
"r_x3": 308.9,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 143.9,
"r_x1": 502.0,
"r_y1": 143.9,
"r_x2": 502.0,
"r_y2": 135.0,
"r_x3": 308.9,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.5,
"r_y0": 143.7,
"r_x1": 545.1,
"r_y1": 143.7,
"r_x2": 545.1,
"r_y2": 135.1,
"r_x3": 504.5,
"r_y3": 135.1,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 155.6,
"r_x1": 343.2,
"r_y1": 155.6,
"r_x2": 343.2,
"r_y2": 147.0,
"r_x3": 308.9,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 155.8,
"r_x1": 545.1,
"r_y1": 155.8,
"r_x2": 545.1,
"r_y2": 146.9,
"r_x3": 346.4,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 167.8,
"r_x1": 446.2,
"r_y1": 167.8,
"r_x2": 446.2,
"r_y2": 158.9,
"r_x3": 308.9,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.3,
"r_y0": 167.6,
"r_x1": 525.0,
"r_y1": 167.6,
"r_x2": 525.0,
"r_y2": 159.0,
"r_x3": 448.3,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.1,
"r_y1": 167.8,
"r_x2": 545.1,
"r_y2": 158.9,
"r_x3": 527.4,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 179.8,
"r_x1": 545.1,
"r_y1": 179.8,
"r_x2": 545.1,
"r_y2": 170.8,
"r_x3": 308.9,
"r_y3": 170.8,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 191.7,
"r_x1": 432.9,
"r_y1": 191.7,
"r_x2": 432.9,
"r_y2": 182.8,
"r_x3": 308.9,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.4,
"r_y0": 191.5,
"r_x1": 510.9,
"r_y1": 191.5,
"r_x2": 510.9,
"r_y2": 182.9,
"r_x3": 436.4,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.7,
"r_y0": 191.7,
"r_x1": 545.1,
"r_y1": 191.7,
"r_x2": 545.1,
"r_y2": 182.8,
"r_x3": 514.7,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 203.7,
"r_x1": 431.2,
"r_y1": 203.7,
"r_x2": 431.2,
"r_y2": 194.8,
"r_x3": 308.9,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 203.4,
"r_x1": 514.2,
"r_y1": 203.4,
"r_x2": 514.2,
"r_y2": 194.8,
"r_x3": 434.7,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.2,
"r_y0": 203.7,
"r_x1": 545.1,
"r_y1": 203.7,
"r_x2": 545.1,
"r_y2": 194.8,
"r_x3": 514.2,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 215.4,
"r_x1": 382.4,
"r_y1": 215.4,
"r_x2": 382.4,
"r_y2": 206.8,
"r_x3": 308.9,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 215.6,
"r_x1": 545.1,
"r_y1": 215.6,
"r_x2": 545.1,
"r_y2": 206.7,
"r_x3": 385.1,
"r_y3": 206.7,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 227.6,
"r_x1": 501.7,
"r_y1": 227.6,
"r_x2": 501.7,
"r_y2": 218.7,
"r_x3": 308.9,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."
},
{
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.4,
"t": 247.9,
"r": 533.6,
"b": 303.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 12,
"page_no": 6,
"cluster": {
"id": 12,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 316.4,
"r": 545.1,
"b": 337.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 325.4,
"r_x1": 341.5,
"r_y1": 325.4,
"r_x2": 341.5,
"r_y2": 316.4,
"r_x3": 308.9,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.4,
"r_x1": 545.1,
"r_y1": 325.4,
"r_x2": 545.1,
"r_y2": 316.4,
"r_x3": 348.6,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.3,
"r_x1": 475.0,
"r_y1": 337.3,
"r_x2": 475.0,
"r_y2": 328.4,
"r_x3": 308.9,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."
},
{
"label": "text",
"id": 4,
"page_no": 6,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 367.7,
"r": 545.1,
"b": 520.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 376.6,
"r_x1": 378.9,
"r_y1": 376.6,
"r_x2": 378.9,
"r_y2": 367.7,
"r_x3": 320.8,
"r_y3": 367.7,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.1,
"r_y0": 376.7,
"r_x1": 545.1,
"r_y1": 376.7,
"r_x2": 545.1,
"r_y2": 367.8,
"r_x3": 387.1,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.7,
"r_x1": 487.2,
"r_y1": 388.7,
"r_x2": 487.2,
"r_y2": 379.8,
"r_x3": 308.9,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.0,
"r_y0": 388.7,
"r_x1": 545.1,
"r_y1": 388.7,
"r_x2": 545.1,
"r_y2": 379.8,
"r_x3": 494.0,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.6,
"r_x1": 545.1,
"r_y1": 400.6,
"r_x2": 545.1,
"r_y2": 391.7,
"r_x3": 308.9,
"r_y3": 391.7,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.6,
"r_x1": 545.1,
"r_y1": 412.6,
"r_x2": 545.1,
"r_y2": 403.7,
"r_x3": 308.9,
"r_y3": 403.7,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.5,
"r_x1": 314.1,
"r_y1": 424.5,
"r_x2": 314.1,
"r_y2": 415.6,
"r_x3": 308.9,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 424.5,
"r_x1": 545.1,
"r_y1": 424.5,
"r_x2": 545.1,
"r_y2": 415.6,
"r_x3": 316.7,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.5,
"r_x1": 545.1,
"r_y1": 436.5,
"r_x2": 545.1,
"r_y2": 427.6,
"r_x3": 308.9,
"r_y3": 427.6,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.4,
"r_x1": 545.1,
"r_y1": 448.4,
"r_x2": 545.1,
"r_y2": 439.5,
"r_x3": 308.9,
"r_y3": 439.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.4,
"r_x1": 350.2,
"r_y1": 460.4,
"r_x2": 350.2,
"r_y2": 451.5,
"r_x3": 308.9,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.2,
"r_y0": 460.3,
"r_x1": 374.6,
"r_y1": 460.3,
"r_x2": 374.6,
"r_y2": 451.4,
"r_x3": 352.2,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.5,
"r_y0": 460.4,
"r_x1": 545.1,
"r_y1": 460.4,
"r_x2": 545.1,
"r_y2": 451.5,
"r_x3": 376.5,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 308.9,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.4,
"r_x3": 308.9,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.3,
"r_x1": 545.1,
"r_y1": 496.3,
"r_x2": 545.1,
"r_y2": 487.4,
"r_x3": 308.9,
"r_y3": 487.4,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.2,
"r_x1": 405.7,
"r_y1": 520.2,
"r_x2": 405.7,
"r_y2": 511.3,
"r_x3": 308.9,
"r_y3": 511.3,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."
},
{
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 333.0,
"t": 540.3,
"r": 520.9,
"b": 643.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.2,
"r": 485.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 11,
"page_no": 6,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 656.9,
"r": 545.1,
"b": 689.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.8,
"r_x1": 341.7,
"r_y1": 665.8,
"r_x2": 341.7,
"r_y2": 656.9,
"r_x3": 308.9,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.6,
"r_y0": 665.8,
"r_x1": 545.1,
"r_y1": 665.8,
"r_x2": 545.1,
"r_y2": 656.9,
"r_x3": 349.6,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.7,
"r_x1": 545.1,
"r_y1": 677.7,
"r_x2": 545.1,
"r_y2": 668.8,
"r_x3": 308.9,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.7,
"r_x1": 435.0,
"r_y1": 689.7,
"r_x2": 435.0,
"r_y2": 680.8,
"r_x3": 308.9,
"r_y3": 680.8,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."
},
{
"label": "page_footer",
"id": 14,
"page_no": 6,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7"
}
],
"body": [
{
"label": "section_header",
"id": 10,
"page_no": 6,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 74.4,
"r": 167.9,
"b": 84.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.3,
"r_x1": 63.7,
"r_y1": 84.3,
"r_x2": 63.7,
"r_y2": 74.4,
"r_x3": 50.1,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3.",
"orig": "5.3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.8,
"r_y0": 84.3,
"r_x1": 167.9,
"r_y1": 84.3,
"r_x2": 167.9,
"r_y2": 74.4,
"r_x3": 72.8,
"r_y3": 74.4,
"coord_origin": "TOPLEFT"
},
"text": "Datasets and Metrics",
"orig": "Datasets and Metrics",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.3. Datasets and Metrics"
},
{
"label": "text",
"id": 1,
"page_no": 6,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 93.4,
"r": 286.4,
"b": 138.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 102.3,
"r_x1": 286.4,
"r_y1": 102.3,
"r_x2": 286.4,
"r_y2": 93.4,
"r_x3": 62.1,
"r_y3": 93.4,
"coord_origin": "TOPLEFT"
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 114.2,
"r_x1": 286.4,
"r_y1": 114.2,
"r_x2": 286.4,
"r_y2": 105.3,
"r_x3": 50.1,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "ric was introduced in [37]. It represents the prediction, and",
"orig": "ric was introduced in [37]. It represents the prediction, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 126.2,
"r_x1": 286.4,
"r_y1": 126.2,
"r_x2": 286.4,
"r_y2": 117.3,
"r_x3": 50.1,
"r_y3": 117.3,
"coord_origin": "TOPLEFT"
},
"text": "ground-truth as a tree structure of HTML tags. This simi-",
"orig": "ground-truth as a tree structure of HTML tags. This simi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 138.1,
"r_x1": 136.7,
"r_y1": 138.1,
"r_x2": 136.7,
"r_y2": 129.2,
"r_x3": 50.1,
"r_y3": 129.2,
"coord_origin": "TOPLEFT"
},
"text": "larity is calculated as:",
"orig": "larity is calculated as:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"
},
{
"label": "formula",
"id": 13,
"page_no": 6,
"cluster": {
"id": 13,
"label": "formula",
"bbox": {
"l": 86.2,
"t": 150.3,
"r": 286.4,
"b": 172.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.2,
"r_y0": 165.9,
"r_x1": 118.9,
"r_y1": 165.9,
"r_x2": 118.9,
"r_y2": 157.1,
"r_x3": 86.2,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "TEDS (",
"orig": "TEDS (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.9,
"r_y0": 165.9,
"r_x1": 143.3,
"r_y1": 165.9,
"r_x2": 143.3,
"r_y2": 157.1,
"r_x3": 118.9,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.8,
"r_y0": 165.9,
"r_x1": 165.9,
"r_y1": 165.9,
"r_x2": 165.9,
"r_y2": 157.1,
"r_x3": 143.8,
"r_y3": 157.1,
"coord_origin": "TOPLEFT"
},
"text": ") = 1",
"orig": ") = 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.1,
"r_y0": 165.9,
"r_x1": 175.9,
"r_y1": 165.9,
"r_x2": 175.9,
"r_y2": 156.5,
"r_x3": 168.1,
"r_y3": 156.5,
"coord_origin": "TOPLEFT"
},
"text": "\u2212",
"orig": "\u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 179.3,
"r_y0": 159.2,
"r_x1": 222.0,
"r_y1": 159.2,
"r_x2": 222.0,
"r_y2": 150.3,
"r_x3": 179.3,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "EditDist (",
"orig": "EditDist (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 222.0,
"r_y0": 159.2,
"r_x1": 246.3,
"r_y1": 159.2,
"r_x2": 246.3,
"r_y2": 150.3,
"r_x3": 222.0,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$, T$_{b}$",
"orig": "T$_{a}$, T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.8,
"r_y0": 159.2,
"r_x1": 250.7,
"r_y1": 159.2,
"r_x2": 250.7,
"r_y2": 150.3,
"r_x3": 246.8,
"r_y3": 150.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.2,
"r_y0": 172.7,
"r_x1": 206.3,
"r_y1": 172.7,
"r_x2": 206.3,
"r_y2": 163.9,
"r_x3": 182.2,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "max (",
"orig": "max (",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 172.7,
"r_x1": 209.1,
"r_y1": 172.7,
"r_x2": 209.1,
"r_y2": 163.3,
"r_x3": 206.3,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.1,
"r_y0": 172.7,
"r_x1": 219.2,
"r_y1": 172.7,
"r_x2": 219.2,
"r_y2": 163.9,
"r_x3": 209.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.7,
"r_y0": 172.7,
"r_x1": 222.5,
"r_y1": 172.7,
"r_x2": 222.5,
"r_y2": 163.3,
"r_x3": 219.7,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 224.1,
"r_y0": 172.7,
"r_x1": 226.9,
"r_y1": 172.7,
"r_x2": 226.9,
"r_y2": 163.9,
"r_x3": 224.1,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ",",
"orig": ",",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 228.6,
"r_y0": 172.7,
"r_x1": 231.3,
"r_y1": 172.7,
"r_x2": 231.3,
"r_y2": 163.3,
"r_x3": 228.6,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.3,
"r_y0": 172.7,
"r_x1": 240.6,
"r_y1": 172.7,
"r_x2": 240.6,
"r_y2": 163.9,
"r_x3": 231.3,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 241.1,
"r_y0": 172.7,
"r_x1": 243.9,
"r_y1": 172.7,
"r_x2": 243.9,
"r_y2": 163.3,
"r_x3": 241.1,
"r_y3": 163.3,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 243.9,
"r_y0": 172.7,
"r_x1": 247.8,
"r_y1": 172.7,
"r_x2": 247.8,
"r_y2": 163.9,
"r_x3": 243.9,
"r_y3": 163.9,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 166.1,
"r_x1": 286.4,
"r_y1": 166.1,
"r_x2": 286.4,
"r_y2": 157.2,
"r_x3": 274.7,
"r_y3": 157.2,
"coord_origin": "TOPLEFT"
},
"text": "(3)",
"orig": "(3)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TEDS ( T$_{a}$, T$_{b}$ ) = 1 \u2212 EditDist ( T$_{a}$, T$_{b}$ ) max ( | T$_{a}$ | , | T$_{b}$ | ) (3)"
},
{
"label": "text",
"id": 6,
"page_no": 6,
"cluster": {
"id": 6,
"label": "text",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 286.4,
"b": 214.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 190.1,
"r_x1": 86.4,
"r_y1": 190.1,
"r_x2": 86.4,
"r_y2": 181.2,
"r_x3": 62.1,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.6,
"r_y0": 189.8,
"r_x1": 98.7,
"r_y1": 189.8,
"r_x2": 98.7,
"r_y2": 181.0,
"r_x3": 88.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{a}$",
"orig": "T$_{a}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 101.4,
"r_y0": 190.1,
"r_x1": 115.8,
"r_y1": 190.1,
"r_x2": 115.8,
"r_y2": 181.2,
"r_x3": 101.4,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 118.0,
"r_y0": 189.8,
"r_x1": 127.3,
"r_y1": 189.8,
"r_x2": 127.3,
"r_y2": 181.0,
"r_x3": 118.0,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "T$_{b}$",
"orig": "T$_{b}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 130.0,
"r_y0": 190.1,
"r_x1": 286.4,
"r_y1": 190.1,
"r_x2": 286.4,
"r_y2": 181.2,
"r_x3": 130.0,
"r_y3": 181.2,
"coord_origin": "TOPLEFT"
},
"text": "represent tables in tree structure HTML",
"orig": "represent tables in tree structure HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 202.0,
"r_x1": 252.8,
"r_y1": 202.0,
"r_x2": 252.8,
"r_y2": 193.1,
"r_x3": 50.1,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "format. EditDist denotes the tree-edit distance, and",
"orig": "format. EditDist denotes the tree-edit distance, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.2,
"r_y0": 201.8,
"r_x1": 257.9,
"r_y1": 201.8,
"r_x2": 257.9,
"r_y2": 192.4,
"r_x3": 255.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 257.9,
"r_y0": 201.8,
"r_x1": 263.8,
"r_y1": 201.8,
"r_x2": 263.8,
"r_y2": 193.0,
"r_x3": 257.9,
"r_y3": 193.0,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 265.2,
"r_y0": 201.8,
"r_x1": 267.9,
"r_y1": 201.8,
"r_x2": 267.9,
"r_y2": 192.4,
"r_x3": 265.2,
"r_y3": 192.4,
"coord_origin": "TOPLEFT"
},
"text": "|",
"orig": "|",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.3,
"r_y0": 202.0,
"r_x1": 286.4,
"r_y1": 202.0,
"r_x2": 286.4,
"r_y2": 193.1,
"r_x3": 270.3,
"r_y3": 193.1,
"coord_origin": "TOPLEFT"
},
"text": "rep-",
"orig": "rep-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 214.0,
"r_x1": 172.1,
"r_y1": 214.0,
"r_x2": 172.1,
"r_y2": 205.1,
"r_x3": 50.1,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": "resents the number of nodes in",
"orig": "resents the number of nodes in",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 174.6,
"r_y0": 213.8,
"r_x1": 180.4,
"r_y1": 213.8,
"r_x2": 180.4,
"r_y2": 204.9,
"r_x3": 174.6,
"r_y3": 204.9,
"coord_origin": "TOPLEFT"
},
"text": "T",
"orig": "T",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 181.8,
"r_y0": 214.0,
"r_x1": 184.3,
"r_y1": 214.0,
"r_x2": 184.3,
"r_y2": 205.1,
"r_x3": 181.8,
"r_y3": 205.1,
"coord_origin": "TOPLEFT"
},
"text": ".",
"orig": ".",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where T$_{a}$ and T$_{b}$ represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."
},
{
"label": "section_header",
"id": 9,
"page_no": 6,
"cluster": {
"id": 9,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 224.8,
"r": 170.5,
"b": 234.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 234.7,
"r_x1": 64.6,
"r_y1": 234.7,
"r_x2": 64.6,
"r_y2": 224.8,
"r_x3": 50.1,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "5.4.",
"orig": "5.4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.2,
"r_y0": 234.7,
"r_x1": 170.5,
"r_y1": 234.7,
"r_x2": 170.5,
"r_y2": 224.8,
"r_x3": 74.2,
"r_y3": 224.8,
"coord_origin": "TOPLEFT"
},
"text": "Quantitative Analysis",
"orig": "Quantitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.4. Quantitative Analysis"
},
{
"label": "text",
"id": 2,
"page_no": 6,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 243.6,
"r": 286.4,
"b": 396.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 252.6,
"r_x1": 105.3,
"r_y1": 252.6,
"r_x2": 105.3,
"r_y2": 243.6,
"r_x3": 62.1,
"r_y3": 243.6,
"coord_origin": "TOPLEFT"
},
"text": "Structure.",
"orig": "Structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.1,
"r_y0": 252.7,
"r_x1": 184.7,
"r_y1": 252.7,
"r_x2": 184.7,
"r_y2": 243.8,
"r_x3": 112.1,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "As shown in Tab.",
"orig": "As shown in Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 191.5,
"r_y0": 252.7,
"r_x1": 286.4,
"r_y1": 252.7,
"r_x2": 286.4,
"r_y2": 243.8,
"r_x3": 191.5,
"r_y3": 243.8,
"coord_origin": "TOPLEFT"
},
"text": "2, TableFormer outper-",
"orig": "2, TableFormer outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 264.6,
"r_x1": 286.4,
"r_y1": 264.6,
"r_x2": 286.4,
"r_y2": 255.7,
"r_x3": 50.1,
"r_y3": 255.7,
"coord_origin": "TOPLEFT"
},
"text": "forms all SOTA methods across different datasets by a large",
"orig": "forms all SOTA methods across different datasets by a large",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 276.6,
"r_x1": 286.4,
"r_y1": 276.6,
"r_x2": 286.4,
"r_y2": 267.7,
"r_x3": 50.1,
"r_y3": 267.7,
"coord_origin": "TOPLEFT"
},
"text": "margin for predicting the table structure from an image.",
"orig": "margin for predicting the table structure from an image.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 288.5,
"r_x1": 286.4,
"r_y1": 288.5,
"r_x2": 286.4,
"r_y2": 279.6,
"r_x3": 50.1,
"r_y3": 279.6,
"coord_origin": "TOPLEFT"
},
"text": "All the more, our model outperforms pre-trained methods.",
"orig": "All the more, our model outperforms pre-trained methods.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.5,
"r_x1": 286.4,
"r_y1": 300.5,
"r_x2": 286.4,
"r_y2": 291.6,
"r_x3": 50.1,
"r_y3": 291.6,
"coord_origin": "TOPLEFT"
},
"text": "During the evaluation we do not apply any table filtering.",
"orig": "During the evaluation we do not apply any table filtering.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.5,
"r_x1": 286.4,
"r_y1": 312.5,
"r_x2": 286.4,
"r_y2": 303.5,
"r_x3": 50.1,
"r_y3": 303.5,
"coord_origin": "TOPLEFT"
},
"text": "We also provide our baseline results on the SynthTabNet",
"orig": "We also provide our baseline results on the SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.4,
"r_x1": 286.4,
"r_y1": 324.4,
"r_x2": 286.4,
"r_y2": 315.5,
"r_x3": 50.1,
"r_y3": 315.5,
"coord_origin": "TOPLEFT"
},
"text": "dataset. It has been observed that large tables (e.g. tables",
"orig": "dataset. It has been observed that large tables (e.g. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 336.4,
"r_x1": 286.4,
"r_y1": 336.4,
"r_x2": 286.4,
"r_y2": 327.5,
"r_x3": 50.1,
"r_y3": 327.5,
"coord_origin": "TOPLEFT"
},
"text": "that occupy half of the page or more) yield poor predictions.",
"orig": "that occupy half of the page or more) yield poor predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 348.3,
"r_x1": 286.4,
"r_y1": 348.3,
"r_x2": 286.4,
"r_y2": 339.4,
"r_x3": 50.1,
"r_y3": 339.4,
"coord_origin": "TOPLEFT"
},
"text": "We attribute this issue to the image resizing during the pre-",
"orig": "We attribute this issue to the image resizing during the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 360.3,
"r_x1": 286.4,
"r_y1": 360.3,
"r_x2": 286.4,
"r_y2": 351.4,
"r_x3": 50.1,
"r_y3": 351.4,
"coord_origin": "TOPLEFT"
},
"text": "processing step, that produces downsampled images with",
"orig": "processing step, that produces downsampled images with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 372.2,
"r_x1": 286.4,
"r_y1": 372.2,
"r_x2": 286.4,
"r_y2": 363.3,
"r_x3": 50.1,
"r_y3": 363.3,
"coord_origin": "TOPLEFT"
},
"text": "indistinguishable features. This problem can be addressed",
"orig": "indistinguishable features. This problem can be addressed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 384.2,
"r_x1": 286.4,
"r_y1": 384.2,
"r_x2": 286.4,
"r_y2": 375.3,
"r_x3": 50.1,
"r_y3": 375.3,
"coord_origin": "TOPLEFT"
},
"text": "by treating such big tables with a separate model which ac-",
"orig": "by treating such big tables with a separate model which ac-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 396.1,
"r_x1": 170.0,
"r_y1": 396.1,
"r_x2": 170.0,
"r_y2": 387.2,
"r_x3": 50.1,
"r_y3": 387.2,
"coord_origin": "TOPLEFT"
},
"text": "cepts a large input image size.",
"orig": "cepts a large input image size.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."
},
{
"label": "table",
"id": 0,
"page_no": 6,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 53.4,
"t": 409.1,
"r": 283.0,
"b": 582.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 27,
"label": "text",
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.8,
"r_y0": 429.6,
"r_x1": 104.9,
"r_y1": 429.6,
"r_x2": 104.9,
"r_y2": 420.7,
"r_x3": 78.8,
"r_y3": 420.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 28,
"label": "text",
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.2,
"r_y0": 423.6,
"r_x1": 236.1,
"r_y1": 423.6,
"r_x2": 236.1,
"r_y2": 414.7,
"r_x3": 211.2,
"r_y3": 414.7,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "text",
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 129.3,
"r_y0": 435.6,
"r_x1": 159.2,
"r_y1": 435.6,
"r_x2": 159.2,
"r_y2": 426.7,
"r_x3": 129.3,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 30,
"label": "text",
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.2,
"r_y0": 435.6,
"r_x1": 199.4,
"r_y1": 435.6,
"r_x2": 199.4,
"r_y2": 426.7,
"r_x3": 171.2,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "text",
"bbox": {
"l": 211.4,
"t": 426.7,
"r": 247.7,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.4,
"r_y0": 435.6,
"r_x1": 247.7,
"r_y1": 435.6,
"r_x2": 247.7,
"r_y2": 426.7,
"r_x3": 211.4,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 32,
"label": "text",
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 264.5,
"r_y0": 435.6,
"r_x1": 277.3,
"r_y1": 435.6,
"r_x2": 277.3,
"r_y2": 426.7,
"r_x3": 264.5,
"r_y3": 426.7,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 33,
"label": "text",
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 452.5,
"r_x1": 102.1,
"r_y1": 452.5,
"r_x2": 102.1,
"r_y2": 443.6,
"r_x3": 81.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 34,
"label": "text",
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 452.5,
"r_x1": 153.7,
"r_y1": 452.5,
"r_x2": 153.7,
"r_y2": 443.6,
"r_x3": 134.9,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 35,
"label": "text",
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 452.5,
"r_x1": 194.0,
"r_y1": 452.5,
"r_x2": 194.0,
"r_y2": 443.6,
"r_x3": 176.6,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "91.1",
"orig": "91.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 36,
"label": "text",
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 452.5,
"r_x1": 238.3,
"r_y1": 452.5,
"r_x2": 238.3,
"r_y2": 443.6,
"r_x3": 220.8,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "88.7",
"orig": "88.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 37,
"label": "text",
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 452.5,
"r_x1": 279.6,
"r_y1": 452.5,
"r_x2": 279.6,
"r_y2": 443.6,
"r_x3": 262.2,
"r_y3": 443.6,
"coord_origin": "TOPLEFT"
},
"text": "89.9",
"orig": "89.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 38,
"label": "text",
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 464.5,
"r_x1": 101.5,
"r_y1": 464.5,
"r_x2": 101.5,
"r_y2": 455.6,
"r_x3": 82.2,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 39,
"label": "text",
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 464.5,
"r_x1": 153.7,
"r_y1": 464.5,
"r_x2": 153.7,
"r_y2": 455.6,
"r_x3": 134.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 40,
"label": "text",
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 464.5,
"r_x1": 186.9,
"r_y1": 464.5,
"r_x2": 186.9,
"r_y2": 455.6,
"r_x3": 183.6,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "text",
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 464.5,
"r_x1": 231.2,
"r_y1": 464.5,
"r_x2": 231.2,
"r_y2": 455.6,
"r_x3": 227.9,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 42,
"label": "text",
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 464.5,
"r_x1": 282.1,
"r_y1": 464.5,
"r_x2": 282.1,
"r_y2": 455.6,
"r_x3": 259.7,
"r_y3": 455.6,
"coord_origin": "TOPLEFT"
},
"text": "93.01",
"orig": "93.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 43,
"label": "text",
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 477.0,
"r_x1": 117.4,
"r_y1": 477.0,
"r_x2": 117.4,
"r_y2": 468.1,
"r_x3": 66.3,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 44,
"label": "text",
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 477.0,
"r_x1": 153.7,
"r_y1": 477.0,
"r_x2": 153.7,
"r_y2": 468.1,
"r_x3": 134.9,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "PTN",
"orig": "PTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 45,
"label": "text",
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 477.0,
"r_x1": 194.0,
"r_y1": 477.0,
"r_x2": 194.0,
"r_y2": 468.1,
"r_x3": 176.6,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "98.5",
"orig": "98.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 46,
"label": "text",
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 477.0,
"r_x1": 238.3,
"r_y1": 477.0,
"r_x2": 238.3,
"r_y2": 468.1,
"r_x3": 220.8,
"r_y3": 468.1,
"coord_origin": "TOPLEFT"
},
"text": "95.0",
"orig": "95.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 477.0,
"r_x1": 282.1,
"r_y1": 477.0,
"r_x2": 282.1,
"r_y2": 468.0,
"r_x3": 259.7,
"r_y3": 468.0,
"coord_origin": "TOPLEFT"
},
"text": "96.75",
"orig": "96.75",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 492.2,
"r_x1": 102.1,
"r_y1": 492.2,
"r_x2": 102.1,
"r_y2": 483.3,
"r_x3": 81.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 492.2,
"r_x1": 153.7,
"r_y1": 492.2,
"r_x2": 153.7,
"r_y2": 483.3,
"r_x3": 134.9,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 492.2,
"r_x1": 194.0,
"r_y1": 492.2,
"r_x2": 194.0,
"r_y2": 483.3,
"r_x3": 176.6,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "88.4",
"orig": "88.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.3,
"r_y0": 492.2,
"r_x1": 240.8,
"r_y1": 492.2,
"r_x2": 240.8,
"r_y2": 483.3,
"r_x3": 218.3,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "92.08",
"orig": "92.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 492.2,
"r_x1": 279.6,
"r_y1": 492.2,
"r_x2": 279.6,
"r_y2": 483.3,
"r_x3": 262.2,
"r_y3": 483.3,
"coord_origin": "TOPLEFT"
},
"text": "90.6",
"orig": "90.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.2,
"r_y0": 504.2,
"r_x1": 101.5,
"r_y1": 504.2,
"r_x2": 101.5,
"r_y2": 495.3,
"r_x3": 82.2,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "GTE",
"orig": "GTE",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 504.2,
"r_x1": 153.7,
"r_y1": 504.2,
"r_x2": 153.7,
"r_y2": 495.3,
"r_x3": 134.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 504.2,
"r_x1": 186.9,
"r_y1": 504.2,
"r_x2": 186.9,
"r_y2": 495.3,
"r_x3": 183.6,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 504.2,
"r_x1": 231.2,
"r_y1": 504.2,
"r_x2": 231.2,
"r_y2": 495.3,
"r_x3": 227.9,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 504.2,
"r_x1": 282.1,
"r_y1": 504.2,
"r_x2": 282.1,
"r_y2": 495.3,
"r_x3": 259.7,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "87.14",
"orig": "87.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 516.1,
"r_x1": 111.9,
"r_y1": 516.1,
"r_x2": 111.9,
"r_y2": 507.2,
"r_x3": 71.8,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "GTE (FT)",
"orig": "GTE (FT)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 516.1,
"r_x1": 153.7,
"r_y1": 516.1,
"r_x2": 153.7,
"r_y2": 507.2,
"r_x3": 134.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.6,
"r_y0": 516.1,
"r_x1": 186.9,
"r_y1": 516.1,
"r_x2": 186.9,
"r_y2": 507.2,
"r_x3": 183.6,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 516.1,
"r_x1": 231.2,
"r_y1": 516.1,
"r_x2": 231.2,
"r_y2": 507.2,
"r_x3": 227.9,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 259.7,
"r_y0": 516.1,
"r_x1": 282.1,
"r_y1": 516.1,
"r_x2": 282.1,
"r_y2": 507.2,
"r_x3": 259.7,
"r_y3": 507.2,
"coord_origin": "TOPLEFT"
},
"text": "91.02",
"orig": "91.02",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 528.1,
"r_x1": 117.4,
"r_y1": 528.1,
"r_x2": 117.4,
"r_y2": 519.2,
"r_x3": 66.3,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 528.1,
"r_x1": 153.7,
"r_y1": 528.1,
"r_x2": 153.7,
"r_y2": 519.2,
"r_x3": 134.9,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "FTN",
"orig": "FTN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 528.1,
"r_x1": 194.0,
"r_y1": 528.1,
"r_x2": 194.0,
"r_y2": 519.2,
"r_x3": 176.6,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "97.5",
"orig": "97.5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 528.1,
"r_x1": 238.3,
"r_y1": 528.1,
"r_x2": 238.3,
"r_y2": 519.2,
"r_x3": 220.8,
"r_y3": 519.2,
"coord_origin": "TOPLEFT"
},
"text": "96.0",
"orig": "96.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 528.0,
"r_x1": 279.6,
"r_y1": 528.0,
"r_x2": 279.6,
"r_y2": 519.1,
"r_x3": 262.2,
"r_y3": 519.1,
"coord_origin": "TOPLEFT"
},
"text": "96.8",
"orig": "96.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.6,
"r_y0": 545.4,
"r_x1": 102.1,
"r_y1": 545.4,
"r_x2": 102.1,
"r_y2": 536.5,
"r_x3": 81.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 545.4,
"r_x1": 150.6,
"r_y1": 545.4,
"r_x2": 150.6,
"r_y2": 536.5,
"r_x3": 137.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 545.4,
"r_x1": 194.0,
"r_y1": 545.4,
"r_x2": 194.0,
"r_y2": 536.5,
"r_x3": 176.6,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 545.4,
"r_x1": 231.2,
"r_y1": 545.4,
"r_x2": 231.2,
"r_y2": 536.5,
"r_x3": 227.9,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 545.4,
"r_x1": 279.6,
"r_y1": 545.4,
"r_x2": 279.6,
"r_y2": 536.5,
"r_x3": 262.2,
"r_y3": 536.5,
"coord_origin": "TOPLEFT"
},
"text": "86.0",
"orig": "86.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 557.4,
"r_x1": 117.4,
"r_y1": 557.4,
"r_x2": 117.4,
"r_y2": 548.5,
"r_x3": 66.3,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 137.9,
"r_y0": 557.4,
"r_x1": 150.6,
"r_y1": 557.4,
"r_x2": 150.6,
"r_y2": 548.5,
"r_x3": 137.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "TB",
"orig": "TB",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 557.4,
"r_x1": 194.0,
"r_y1": 557.4,
"r_x2": 194.0,
"r_y2": 548.5,
"r_x3": 176.6,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.9,
"r_y0": 557.4,
"r_x1": 231.2,
"r_y1": 557.4,
"r_x2": 231.2,
"r_y2": 548.5,
"r_x3": 227.9,
"r_y3": 548.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 557.3,
"r_x1": 279.6,
"r_y1": 557.3,
"r_x2": 279.6,
"r_y2": 548.3,
"r_x3": 262.2,
"r_y3": 548.3,
"coord_origin": "TOPLEFT"
},
"text": "89.6",
"orig": "89.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.3,
"r_y0": 576.9,
"r_x1": 117.4,
"r_y1": 576.9,
"r_x2": 117.4,
"r_y2": 568.0,
"r_x3": 66.3,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 134.9,
"r_y0": 576.9,
"r_x1": 153.7,
"r_y1": 576.9,
"r_x2": 153.7,
"r_y2": 568.0,
"r_x3": 134.9,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "STN",
"orig": "STN",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 176.6,
"r_y0": 576.9,
"r_x1": 194.0,
"r_y1": 576.9,
"r_x2": 194.0,
"r_y2": 568.0,
"r_x3": 176.6,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.9",
"orig": "96.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 576.9,
"r_x1": 238.3,
"r_y1": 576.9,
"r_x2": 238.3,
"r_y2": 568.0,
"r_x3": 220.8,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "95.7",
"orig": "95.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 262.2,
"r_y0": 576.9,
"r_x1": 279.6,
"r_y1": 576.9,
"r_x2": 279.6,
"r_y2": 568.0,
"r_x3": 262.2,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "96.7",
"orig": "96.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 11,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 78.8,
"t": 420.7,
"r": 104.9,
"b": 429.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 211.2,
"t": 414.7,
"r": 236.1,
"b": 423.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 129.3,
"t": 426.7,
"r": 159.2,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 171.2,
"t": 426.7,
"r": 199.4,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 264.5,
"t": 426.7,
"r": 277.3,
"b": 435.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 443.6,
"r": 102.1,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 443.6,
"r": 153.7,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 443.6,
"r": 194.0,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "91.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 443.6,
"r": 238.3,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 443.6,
"r": 279.6,
"b": 452.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 455.6,
"r": 101.5,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 455.6,
"r": 153.7,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 455.6,
"r": 186.9,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 455.6,
"r": 231.2,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 455.6,
"r": 282.1,
"b": 464.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "93.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 468.1,
"r": 117.4,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 468.1,
"r": 153.7,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 468.1,
"r": 194.0,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "98.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 468.1,
"r": 238.3,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 468.0,
"r": 282.1,
"b": 477.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.75",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 483.3,
"r": 102.1,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 483.3,
"r": 153.7,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 483.3,
"r": 194.0,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "88.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 218.3,
"t": 483.3,
"r": 240.8,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "92.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 483.3,
"r": 279.6,
"b": 492.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "90.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 82.2,
"t": 495.3,
"r": 101.5,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 495.3,
"r": 153.7,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 495.3,
"r": 186.9,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 495.3,
"r": 231.2,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 495.3,
"r": 282.1,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "87.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 71.8,
"t": 507.2,
"r": 111.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "GTE (FT)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 507.2,
"r": 153.7,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 183.6,
"t": 507.2,
"r": 186.9,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 507.2,
"r": 231.2,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 259.7,
"t": 507.2,
"r": 282.1,
"b": 516.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "91.02",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 519.2,
"r": 117.4,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 519.2,
"r": 153.7,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "FTN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 519.2,
"r": 194.0,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "97.5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 519.2,
"r": 238.3,
"b": 528.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 519.1,
"r": 279.6,
"b": 528.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 81.6,
"t": 536.5,
"r": 102.1,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 536.5,
"r": 150.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 536.5,
"r": 194.0,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 536.5,
"r": 231.2,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 536.5,
"r": 279.6,
"b": 545.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "86.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 548.5,
"r": 117.4,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 137.9,
"t": 548.5,
"r": 150.6,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "TB",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 548.5,
"r": 194.0,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 227.9,
"t": 548.5,
"r": 231.2,
"b": 557.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 548.3,
"r": 279.6,
"b": 557.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "89.6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 66.3,
"t": 568.0,
"r": 117.4,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 134.9,
"t": 568.0,
"r": 153.7,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "STN",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 176.6,
"t": 568.0,
"r": 194.0,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "96.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 220.8,
"t": 568.0,
"r": 238.3,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "95.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 262.2,
"t": 568.0,
"r": 279.6,
"b": 576.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 10,
"end_row_offset_idx": 11,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "96.7",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "text",
"id": 15,
"page_no": 6,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 50.1,
"t": 592.4,
"r": 286.4,
"b": 613.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.72,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 601.3,
"r_x1": 286.4,
"r_y1": 601.3,
"r_x2": 286.4,
"r_y2": 592.4,
"r_x3": 50.1,
"r_y3": 592.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"orig": "Table 2: Structure results on PubTabNet (PTN), FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 613.3,
"r_x1": 247.5,
"r_y1": 613.3,
"r_x2": 247.5,
"r_y2": 604.4,
"r_x3": 50.1,
"r_y3": 604.4,
"coord_origin": "TOPLEFT"
},
"text": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"orig": "(FTN), TableBank (TB) and SynthTabNet (STN).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."
},
{
"label": "text",
"id": 16,
"page_no": 6,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 50.1,
"t": 616.3,
"r": 261.8,
"b": 625.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.64,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 625.2,
"r_x1": 261.8,
"r_y1": 625.2,
"r_x2": 261.8,
"r_y2": 616.3,
"r_x3": 50.1,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": "FT: Model was trained on PubTabNet then finetuned.",
"orig": "FT: Model was trained on PubTabNet then finetuned.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "FT: Model was trained on PubTabNet then finetuned."
},
{
"label": "text",
"id": 3,
"page_no": 6,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 644.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 653.3,
"r_x1": 124.7,
"r_y1": 653.3,
"r_x2": 124.7,
"r_y2": 644.3,
"r_x3": 62.1,
"r_y3": 644.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell Detection.",
"orig": "Cell Detection.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 128.2,
"r_y0": 653.4,
"r_x1": 242.9,
"r_y1": 653.4,
"r_x2": 242.9,
"r_y2": 644.5,
"r_x3": 128.2,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "Like any object detector, our",
"orig": "Like any object detector, our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 245.6,
"r_y0": 653.1,
"r_x1": 286.4,
"r_y1": 653.1,
"r_x2": 286.4,
"r_y2": 644.6,
"r_x3": 245.6,
"r_y3": 644.6,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.1,
"r_x1": 85.0,
"r_y1": 665.1,
"r_x2": 85.0,
"r_y2": 656.5,
"r_x3": 50.1,
"r_y3": 656.5,
"coord_origin": "TOPLEFT"
},
"text": "Detector",
"orig": "Detector",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.5,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 89.5,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "provides bounding boxes that can be improved",
"orig": "provides bounding boxes that can be improved",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "with post-processing during inference. We make use of the",
"orig": "with post-processing during inference. We make use of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "grid-like structure of tables to refine the predictions. A de-",
"orig": "grid-like structure of tables to refine the predictions. A de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tailed explanation on the post-processing is available in the",
"orig": "tailed explanation on the post-processing is available in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "supplementary material. As shown in Tab. 3, we evaluate",
"orig": "supplementary material. As shown in Tab. 3, we evaluate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"
},
{
"label": "text",
"id": 7,
"page_no": 6,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 308.9,
"t": 75.2,
"r": 545.1,
"b": 227.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 84.1,
"r_x1": 322.1,
"r_y1": 84.1,
"r_x2": 322.1,
"r_y2": 75.2,
"r_x3": 308.9,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "our",
"orig": "our",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.5,
"r_y0": 83.9,
"r_x1": 404.6,
"r_y1": 83.9,
"r_x2": 404.6,
"r_y2": 75.3,
"r_x3": 325.5,
"r_y3": 75.3,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.1,
"r_y0": 84.1,
"r_x1": 545.1,
"r_y1": 84.1,
"r_x2": 545.1,
"r_y2": 75.2,
"r_x3": 408.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "accuracy for cells with a class la-",
"orig": "accuracy for cells with a class la-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 96.1,
"r_x1": 545.1,
"r_y1": 96.1,
"r_x2": 545.1,
"r_y2": 87.2,
"r_x3": 308.9,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"orig": "bel of \u2018content\u2019 only using the PASCAL VOC mAP metric",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 108.0,
"r_x1": 470.2,
"r_y1": 108.0,
"r_x2": 470.2,
"r_y2": 99.1,
"r_x3": 308.9,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "for pre-processing and post-processing.",
"orig": "for pre-processing and post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 477.5,
"r_y0": 108.0,
"r_x1": 545.1,
"r_y1": 108.0,
"r_x2": 545.1,
"r_y2": 99.1,
"r_x3": 477.5,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "Note that we do",
"orig": "Note that we do",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 120.0,
"r_x1": 545.1,
"r_y1": 120.0,
"r_x2": 545.1,
"r_y2": 111.1,
"r_x3": 308.9,
"r_y3": 111.1,
"coord_origin": "TOPLEFT"
},
"text": "not have post-processing results for SynthTabNet as images",
"orig": "not have post-processing results for SynthTabNet as images",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 131.9,
"r_x1": 545.1,
"r_y1": 131.9,
"r_x2": 545.1,
"r_y2": 123.0,
"r_x3": 308.9,
"r_y3": 123.0,
"coord_origin": "TOPLEFT"
},
"text": "are only provided. To compare the performance of our pro-",
"orig": "are only provided. To compare the performance of our pro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 143.9,
"r_x1": 502.0,
"r_y1": 143.9,
"r_x2": 502.0,
"r_y2": 135.0,
"r_x3": 308.9,
"r_y3": 135.0,
"coord_origin": "TOPLEFT"
},
"text": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"orig": "posed approach, we\u2019ve integrated TableFormer\u2019s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 504.5,
"r_y0": 143.7,
"r_x1": 545.1,
"r_y1": 143.7,
"r_x2": 545.1,
"r_y2": 135.1,
"r_x3": 504.5,
"r_y3": 135.1,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox",
"orig": "Cell BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 155.6,
"r_x1": 343.2,
"r_y1": 155.6,
"r_x2": 343.2,
"r_y2": 147.0,
"r_x3": 308.9,
"r_y3": 147.0,
"coord_origin": "TOPLEFT"
},
"text": "Decoder",
"orig": "Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 155.8,
"r_x1": 545.1,
"r_y1": 155.8,
"r_x2": 545.1,
"r_y2": 146.9,
"r_x3": 346.4,
"r_y3": 146.9,
"coord_origin": "TOPLEFT"
},
"text": "into EDD architecture. As mentioned previously,",
"orig": "into EDD architecture. As mentioned previously,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 167.8,
"r_x1": 446.2,
"r_y1": 167.8,
"r_x2": 446.2,
"r_y2": 158.9,
"r_x3": 308.9,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "the Structure Decoder provides the",
"orig": "the Structure Decoder provides the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.3,
"r_y0": 167.6,
"r_x1": 525.0,
"r_y1": 167.6,
"r_x2": 525.0,
"r_y2": 159.0,
"r_x3": 448.3,
"r_y3": 159.0,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 527.4,
"r_y0": 167.8,
"r_x1": 545.1,
"r_y1": 167.8,
"r_x2": 545.1,
"r_y2": 158.9,
"r_x3": 527.4,
"r_y3": 158.9,
"coord_origin": "TOPLEFT"
},
"text": "with",
"orig": "with",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 179.8,
"r_x1": 545.1,
"r_y1": 179.8,
"r_x2": 545.1,
"r_y2": 170.8,
"r_x3": 308.9,
"r_y3": 170.8,
"coord_origin": "TOPLEFT"
},
"text": "the features needed to predict the bounding box predictions.",
"orig": "the features needed to predict the bounding box predictions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 191.7,
"r_x1": 432.9,
"r_y1": 191.7,
"r_x2": 432.9,
"r_y2": 182.8,
"r_x3": 308.9,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "Therefore, the accuracy of the",
"orig": "Therefore, the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 436.4,
"r_y0": 191.5,
"r_x1": 510.9,
"r_y1": 191.5,
"r_x2": 510.9,
"r_y2": 182.9,
"r_x3": 436.4,
"r_y3": 182.9,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.7,
"r_y0": 191.7,
"r_x1": 545.1,
"r_y1": 191.7,
"r_x2": 545.1,
"r_y2": 182.8,
"r_x3": 514.7,
"r_y3": 182.8,
"coord_origin": "TOPLEFT"
},
"text": "directly",
"orig": "directly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 203.7,
"r_x1": 431.2,
"r_y1": 203.7,
"r_x2": 431.2,
"r_y2": 194.8,
"r_x3": 308.9,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "influences the accuracy of the",
"orig": "influences the accuracy of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 203.4,
"r_x1": 514.2,
"r_y1": 203.4,
"r_x2": 514.2,
"r_y2": 194.8,
"r_x3": 434.7,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": "Cell BBox Decoder",
"orig": "Cell BBox Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.2,
"r_y0": 203.7,
"r_x1": 545.1,
"r_y1": 203.7,
"r_x2": 545.1,
"r_y2": 194.8,
"r_x3": 514.2,
"r_y3": 194.8,
"coord_origin": "TOPLEFT"
},
"text": ". If the",
"orig": ". If the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 215.4,
"r_x1": 382.4,
"r_y1": 215.4,
"r_x2": 382.4,
"r_y2": 206.8,
"r_x3": 308.9,
"r_y3": 206.8,
"coord_origin": "TOPLEFT"
},
"text": "Structure Decoder",
"orig": "Structure Decoder",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.1,
"r_y0": 215.6,
"r_x1": 545.1,
"r_y1": 215.6,
"r_x2": 545.1,
"r_y2": 206.7,
"r_x3": 385.1,
"r_y3": 206.7,
"coord_origin": "TOPLEFT"
},
"text": "predicts an extra column, this will result",
"orig": "predicts an extra column, this will result",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 227.6,
"r_x1": 501.7,
"r_y1": 227.6,
"r_x2": 501.7,
"r_y2": 218.7,
"r_x3": 308.9,
"r_y3": 218.7,
"coord_origin": "TOPLEFT"
},
"text": "in an extra column of predicted bounding boxes.",
"orig": "in an extra column of predicted bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."
},
{
"label": "table",
"id": 8,
"page_no": 6,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 308.4,
"t": 247.9,
"r": 533.6,
"b": 303.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 83,
"label": "text",
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.3,
"r_y0": 262.6,
"r_x1": 365.3,
"r_y1": 262.6,
"r_x2": 365.3,
"r_y2": 253.7,
"r_x3": 339.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 401.0,
"r_y0": 262.6,
"r_x1": 430.9,
"r_y1": 262.6,
"r_x2": 430.9,
"r_y2": 253.7,
"r_x3": 401.0,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 454.1,
"r_y0": 262.6,
"r_x1": 474.6,
"r_y1": 262.6,
"r_x2": 474.6,
"r_y2": 253.7,
"r_x3": 454.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP",
"orig": "mAP",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 486.5,
"r_y0": 262.6,
"r_x1": 527.2,
"r_y1": 262.6,
"r_x2": 527.2,
"r_y2": 253.7,
"r_x3": 486.5,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "mAP (PP)",
"orig": "mAP (PP)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 279.5,
"r_x1": 377.0,
"r_y1": 279.5,
"r_x2": 377.0,
"r_y2": 270.6,
"r_x3": 327.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "EDD+BBox",
"orig": "EDD+BBox",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 279.5,
"r_x1": 438.3,
"r_y1": 279.5,
"r_x2": 438.3,
"r_y2": 270.6,
"r_x3": 393.7,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 279.5,
"r_x1": 473.1,
"r_y1": 279.5,
"r_x2": 473.1,
"r_y2": 270.6,
"r_x3": 455.6,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "79.2",
"orig": "79.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 279.5,
"r_x1": 515.6,
"r_y1": 279.5,
"r_x2": 515.6,
"r_y2": 270.6,
"r_x3": 498.2,
"r_y3": 270.6,
"coord_origin": "TOPLEFT"
},
"text": "82.7",
"orig": "82.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 291.5,
"r_x1": 377.9,
"r_y1": 291.5,
"r_x2": 377.9,
"r_y2": 282.6,
"r_x3": 326.8,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.7,
"r_y0": 291.5,
"r_x1": 438.3,
"r_y1": 291.5,
"r_x2": 438.3,
"r_y2": 282.6,
"r_x3": 393.7,
"r_y3": 282.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 291.4,
"r_x1": 473.1,
"r_y1": 291.4,
"r_x2": 473.1,
"r_y2": 282.5,
"r_x3": 455.6,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "82.1",
"orig": "82.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 498.2,
"r_y0": 291.4,
"r_x1": 515.6,
"r_y1": 291.4,
"r_x2": 515.6,
"r_y2": 282.5,
"r_x3": 498.2,
"r_y3": 282.5,
"coord_origin": "TOPLEFT"
},
"text": "86.8",
"orig": "86.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 303.4,
"r_x1": 377.9,
"r_y1": 303.4,
"r_x2": 377.9,
"r_y2": 294.5,
"r_x3": 326.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 389.8,
"r_y0": 303.4,
"r_x1": 442.2,
"r_y1": 303.4,
"r_x2": 442.2,
"r_y2": 294.5,
"r_x3": 389.8,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "SynthTabNet",
"orig": "SynthTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.6,
"r_y0": 303.4,
"r_x1": 473.1,
"r_y1": 303.4,
"r_x2": 473.1,
"r_y2": 294.5,
"r_x3": 455.6,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "87.7",
"orig": "87.7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 505.2,
"r_y0": 303.4,
"r_x1": 508.5,
"r_y1": 303.4,
"r_x2": 508.5,
"r_y2": 294.5,
"r_x3": 505.2,
"r_y3": 294.5,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 4,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 339.3,
"t": 253.7,
"r": 365.3,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 401.0,
"t": 253.7,
"r": 430.9,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Dataset",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 454.1,
"t": 253.7,
"r": 474.6,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 486.5,
"t": 253.7,
"r": 527.2,
"b": 262.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "mAP (PP)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 327.7,
"t": 270.6,
"r": 377.0,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD+BBox",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 270.6,
"r": 438.3,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 270.6,
"r": 473.1,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "79.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 270.6,
"r": 515.6,
"b": 279.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "82.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 282.6,
"r": 377.9,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 393.7,
"t": 282.6,
"r": 438.3,
"b": 291.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "PubTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 282.5,
"r": 473.1,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "82.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 498.2,
"t": 282.5,
"r": 515.6,
"b": 291.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "86.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.8,
"t": 294.5,
"r": 377.9,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 389.8,
"t": 294.5,
"r": 442.2,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "SynthTabNet",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 455.6,
"t": 294.5,
"r": 473.1,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "87.7",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 505.2,
"t": 294.5,
"r": 508.5,
"b": 303.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 12,
"page_no": 6,
"cluster": {
"id": 12,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 316.4,
"r": 545.1,
"b": 337.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 325.4,
"r_x1": 341.5,
"r_y1": 325.4,
"r_x2": 341.5,
"r_y2": 316.4,
"r_x3": 308.9,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Table 3:",
"orig": "Table 3:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 348.6,
"r_y0": 325.4,
"r_x1": 545.1,
"r_y1": 325.4,
"r_x2": 545.1,
"r_y2": 316.4,
"r_x3": 348.6,
"r_y3": 316.4,
"coord_origin": "TOPLEFT"
},
"text": "Cell Bounding Box detection results on PubTab-",
"orig": "Cell Bounding Box detection results on PubTab-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.3,
"r_x1": 475.0,
"r_y1": 337.3,
"r_x2": 475.0,
"r_y2": 328.4,
"r_x3": 308.9,
"r_y3": 328.4,
"coord_origin": "TOPLEFT"
},
"text": "Net, and FinTabNet. PP: Post-processing.",
"orig": "Net, and FinTabNet. PP: Post-processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."
},
{
"label": "text",
"id": 4,
"page_no": 6,
"cluster": {
"id": 4,
"label": "text",
"bbox": {
"l": 308.9,
"t": 367.7,
"r": 545.1,
"b": 520.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 376.6,
"r_x1": 378.9,
"r_y1": 376.6,
"r_x2": 378.9,
"r_y2": 367.7,
"r_x3": 320.8,
"r_y3": 367.7,
"coord_origin": "TOPLEFT"
},
"text": "Cell Content.",
"orig": "Cell Content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 387.1,
"r_y0": 376.7,
"r_x1": 545.1,
"r_y1": 376.7,
"r_x2": 545.1,
"r_y2": 367.8,
"r_x3": 387.1,
"r_y3": 367.8,
"coord_origin": "TOPLEFT"
},
"text": "In this section, we evaluate the entire",
"orig": "In this section, we evaluate the entire",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 388.7,
"r_x1": 487.2,
"r_y1": 388.7,
"r_x2": 487.2,
"r_y2": 379.8,
"r_x3": 308.9,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "pipeline of recovering a table with content.",
"orig": "pipeline of recovering a table with content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.0,
"r_y0": 388.7,
"r_x1": 545.1,
"r_y1": 388.7,
"r_x2": 545.1,
"r_y2": 379.8,
"r_x3": 494.0,
"r_y3": 379.8,
"coord_origin": "TOPLEFT"
},
"text": "Here we put",
"orig": "Here we put",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 400.6,
"r_x1": 545.1,
"r_y1": 400.6,
"r_x2": 545.1,
"r_y2": 391.7,
"r_x3": 308.9,
"r_y3": 391.7,
"coord_origin": "TOPLEFT"
},
"text": "our approach to test by capitalizing on extracting content",
"orig": "our approach to test by capitalizing on extracting content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.6,
"r_x1": 545.1,
"r_y1": 412.6,
"r_x2": 545.1,
"r_y2": 403.7,
"r_x3": 308.9,
"r_y3": 403.7,
"coord_origin": "TOPLEFT"
},
"text": "from the PDF cells rather than decoding from images. Tab.",
"orig": "from the PDF cells rather than decoding from images. Tab.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.5,
"r_x1": 314.1,
"r_y1": 424.5,
"r_x2": 314.1,
"r_y2": 415.6,
"r_x3": 308.9,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 316.7,
"r_y0": 424.5,
"r_x1": 545.1,
"r_y1": 424.5,
"r_x2": 545.1,
"r_y2": 415.6,
"r_x3": 316.7,
"r_y3": 415.6,
"coord_origin": "TOPLEFT"
},
"text": "shows the TEDs score of HTML code representing the",
"orig": "shows the TEDs score of HTML code representing the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.5,
"r_x1": 545.1,
"r_y1": 436.5,
"r_x2": 545.1,
"r_y2": 427.6,
"r_x3": 308.9,
"r_y3": 427.6,
"coord_origin": "TOPLEFT"
},
"text": "structure of the table along with the content inserted in the",
"orig": "structure of the table along with the content inserted in the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.4,
"r_x1": 545.1,
"r_y1": 448.4,
"r_x2": 545.1,
"r_y2": 439.5,
"r_x3": 308.9,
"r_y3": 439.5,
"coord_origin": "TOPLEFT"
},
"text": "data cell and compared with the ground-truth. Our method",
"orig": "data cell and compared with the ground-truth. Our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.4,
"r_x1": 350.2,
"r_y1": 460.4,
"r_x2": 350.2,
"r_y2": 451.5,
"r_x3": 308.9,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "achieved a",
"orig": "achieved a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.2,
"r_y0": 460.3,
"r_x1": 374.6,
"r_y1": 460.3,
"r_x2": 374.6,
"r_y2": 451.4,
"r_x3": 352.2,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "5.3%",
"orig": "5.3%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 376.5,
"r_y0": 460.4,
"r_x1": 545.1,
"r_y1": 460.4,
"r_x2": 545.1,
"r_y2": 451.5,
"r_x3": 376.5,
"r_y3": 451.5,
"coord_origin": "TOPLEFT"
},
"text": "increase over the state-of-the-art, and com-",
"orig": "increase over the state-of-the-art, and com-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 308.9,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "mercial solutions. We believe our scores would be higher",
"orig": "mercial solutions. We believe our scores would be higher",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.4,
"r_x3": 308.9,
"r_y3": 475.4,
"coord_origin": "TOPLEFT"
},
"text": "if the HTML ground-truth matched the extracted PDF cell",
"orig": "if the HTML ground-truth matched the extracted PDF cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.3,
"r_x1": 545.1,
"r_y1": 496.3,
"r_x2": 545.1,
"r_y2": 487.4,
"r_x3": 308.9,
"r_y3": 487.4,
"coord_origin": "TOPLEFT"
},
"text": "content. Unfortunately, there are small discrepancies such",
"orig": "content. Unfortunately, there are small discrepancies such",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "as spacings around words or special characters with various",
"orig": "as spacings around words or special characters with various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.2,
"r_x1": 405.7,
"r_y1": 520.2,
"r_x2": 405.7,
"r_y2": 511.3,
"r_x3": 308.9,
"r_y3": 511.3,
"coord_origin": "TOPLEFT"
},
"text": "unicode representations.",
"orig": "unicode representations.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."
},
{
"label": "table",
"id": 5,
"page_no": 6,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 333.0,
"t": 540.3,
"r": 520.9,
"b": 643.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 99,
"label": "text",
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 358.0,
"r_y0": 561.1,
"r_x1": 384.0,
"r_y1": 561.1,
"r_x2": 384.0,
"r_y2": 552.2,
"r_x3": 358.0,
"r_y3": 552.2,
"coord_origin": "TOPLEFT"
},
"text": "Model",
"orig": "Model",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 449.0,
"r_y0": 555.2,
"r_x1": 473.9,
"r_y1": 555.2,
"r_x2": 473.9,
"r_y2": 546.3,
"r_x3": 449.0,
"r_y3": 546.3,
"coord_origin": "TOPLEFT"
},
"text": "TEDS",
"orig": "TEDS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.5,
"r_y0": 567.1,
"r_x1": 436.7,
"r_y1": 567.1,
"r_x2": 436.7,
"r_y2": 558.2,
"r_x3": 408.5,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 448.7,
"t": 558.2,
"r": 485.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.7,
"r_y0": 567.1,
"r_x1": 485.1,
"r_y1": 567.1,
"r_x2": 485.1,
"r_y2": 558.2,
"r_x3": 448.7,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 499.4,
"r_y0": 567.1,
"r_x1": 512.1,
"r_y1": 567.1,
"r_x2": 512.1,
"r_y2": 558.2,
"r_x3": 499.4,
"r_y3": 558.2,
"coord_origin": "TOPLEFT"
},
"text": "All",
"orig": "All",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.7,
"r_y0": 584.1,
"r_x1": 384.4,
"r_y1": 584.1,
"r_x2": 384.4,
"r_y2": 575.2,
"r_x3": 357.7,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "Tabula",
"orig": "Tabula",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 584.1,
"r_x1": 431.3,
"r_y1": 584.1,
"r_x2": 431.3,
"r_y2": 575.2,
"r_x3": 413.9,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "78.0",
"orig": "78.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 584.1,
"r_x1": 475.6,
"r_y1": 584.1,
"r_x2": 475.6,
"r_y2": 575.2,
"r_x3": 458.2,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "57.8",
"orig": "57.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 584.1,
"r_x1": 514.5,
"r_y1": 584.1,
"r_x2": 514.5,
"r_y2": 575.2,
"r_x3": 497.0,
"r_y3": 575.2,
"coord_origin": "TOPLEFT"
},
"text": "67.9",
"orig": "67.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 350.7,
"r_y0": 596.0,
"r_x1": 391.3,
"r_y1": 596.0,
"r_x2": 391.3,
"r_y2": 587.1,
"r_x3": 350.7,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "Traprange",
"orig": "Traprange",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 596.0,
"r_x1": 431.3,
"r_y1": 596.0,
"r_x2": 431.3,
"r_y2": 587.1,
"r_x3": 413.9,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "60.8",
"orig": "60.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 596.0,
"r_x1": 475.6,
"r_y1": 596.0,
"r_x2": 475.6,
"r_y2": 587.1,
"r_x3": 458.2,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "49.9",
"orig": "49.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 596.0,
"r_x1": 514.5,
"r_y1": 596.0,
"r_x2": 514.5,
"r_y2": 587.1,
"r_x3": 497.0,
"r_y3": 587.1,
"coord_origin": "TOPLEFT"
},
"text": "55.4",
"orig": "55.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 354.1,
"r_y0": 608.0,
"r_x1": 387.9,
"r_y1": 608.0,
"r_x2": 387.9,
"r_y2": 599.1,
"r_x3": 354.1,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "Camelot",
"orig": "Camelot",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 608.0,
"r_x1": 431.3,
"r_y1": 608.0,
"r_x2": 431.3,
"r_y2": 599.1,
"r_x3": 413.9,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "80.0",
"orig": "80.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 608.0,
"r_x1": 475.6,
"r_y1": 608.0,
"r_x2": 475.6,
"r_y2": 599.1,
"r_x3": 458.2,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "66.0",
"orig": "66.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 608.0,
"r_x1": 514.5,
"r_y1": 608.0,
"r_x2": 514.5,
"r_y2": 599.1,
"r_x3": 497.0,
"r_y3": 599.1,
"coord_origin": "TOPLEFT"
},
"text": "73.0",
"orig": "73.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.6,
"r_y0": 619.9,
"r_x1": 395.5,
"r_y1": 619.9,
"r_x2": 395.5,
"r_y2": 611.0,
"r_x3": 346.6,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "Acrobat Pro",
"orig": "Acrobat Pro",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 619.9,
"r_x1": 431.3,
"r_y1": 619.9,
"r_x2": 431.3,
"r_y2": 611.0,
"r_x3": 413.9,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "68.9",
"orig": "68.9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 619.9,
"r_x1": 475.6,
"r_y1": 619.9,
"r_x2": 475.6,
"r_y2": 611.0,
"r_x3": 458.2,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "61.8",
"orig": "61.8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 619.9,
"r_x1": 514.5,
"r_y1": 619.9,
"r_x2": 514.5,
"r_y2": 611.0,
"r_x3": 497.0,
"r_y3": 611.0,
"coord_origin": "TOPLEFT"
},
"text": "65.3",
"orig": "65.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 631.9,
"r_x1": 381.3,
"r_y1": 631.9,
"r_x2": 381.3,
"r_y2": 623.0,
"r_x3": 360.8,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "EDD",
"orig": "EDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 631.9,
"r_x1": 431.3,
"r_y1": 631.9,
"r_x2": 431.3,
"r_y2": 623.0,
"r_x3": 413.9,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "91.2",
"orig": "91.2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 631.9,
"r_x1": 475.6,
"r_y1": 631.9,
"r_x2": 475.6,
"r_y2": 623.0,
"r_x3": 458.2,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "85.4",
"orig": "85.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 631.9,
"r_x1": 514.5,
"r_y1": 631.9,
"r_x2": 514.5,
"r_y2": 623.0,
"r_x3": 497.0,
"r_y3": 623.0,
"coord_origin": "TOPLEFT"
},
"text": "88.3",
"orig": "88.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.5,
"r_y0": 643.8,
"r_x1": 396.6,
"r_y1": 643.8,
"r_x2": 396.6,
"r_y2": 634.9,
"r_x3": 345.5,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer",
"orig": "TableFormer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 125,
"label": "text",
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 413.9,
"r_y0": 643.8,
"r_x1": 431.3,
"r_y1": 643.8,
"r_x2": 431.3,
"r_y2": 634.9,
"r_x3": 413.9,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "95.4",
"orig": "95.4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 458.2,
"r_y0": 643.8,
"r_x1": 475.6,
"r_y1": 643.8,
"r_x2": 475.6,
"r_y2": 634.9,
"r_x3": 458.2,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "90.1",
"orig": "90.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 497.0,
"r_y0": 643.8,
"r_x1": 514.5,
"r_y1": 643.8,
"r_x2": 514.5,
"r_y2": 634.8,
"r_x3": 497.0,
"r_y3": 634.8,
"coord_origin": "TOPLEFT"
},
"text": "93.6",
"orig": "93.6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 4,
"table_cells": [
{
"bbox": {
"l": 358.0,
"t": 552.2,
"r": 384.0,
"b": 561.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Model",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 449.0,
"t": 546.3,
"r": 473.9,
"b": 555.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "TEDS Complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 408.5,
"t": 558.2,
"r": 436.7,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "Simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 499.4,
"t": 558.2,
"r": 512.1,
"b": 567.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "All",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 357.7,
"t": 575.2,
"r": 384.4,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Tabula",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 575.2,
"r": 431.3,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "78.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 575.2,
"r": 475.6,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "57.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 575.2,
"r": 514.5,
"b": 584.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "67.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 350.7,
"t": 587.1,
"r": 391.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Traprange",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 587.1,
"r": 431.3,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "60.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 587.1,
"r": 475.6,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "49.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 587.1,
"r": 514.5,
"b": 596.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "55.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 354.1,
"t": 599.1,
"r": 387.9,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Camelot",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 599.1,
"r": 431.3,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "80.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 599.1,
"r": 475.6,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "66.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 599.1,
"r": 514.5,
"b": 608.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "73.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 346.6,
"t": 611.0,
"r": 395.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Acrobat Pro",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 611.0,
"r": 431.3,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "68.9",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 611.0,
"r": 475.6,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "61.8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 611.0,
"r": 514.5,
"b": 619.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "65.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 360.8,
"t": 623.0,
"r": 381.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "EDD",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 623.0,
"r": 431.3,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "91.2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 623.0,
"r": 475.6,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "85.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 623.0,
"r": 514.5,
"b": 631.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "88.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 345.5,
"t": 634.9,
"r": 396.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "TableFormer",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 413.9,
"t": 634.9,
"r": 431.3,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "95.4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 458.2,
"t": 634.9,
"r": 475.6,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "90.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 497.0,
"t": 634.8,
"r": 514.5,
"b": 643.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "93.6",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 11,
"page_no": 6,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 656.9,
"r": 545.1,
"b": 689.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 665.8,
"r_x1": 341.7,
"r_y1": 665.8,
"r_x2": 341.7,
"r_y2": 656.9,
"r_x3": 308.9,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Table 4:",
"orig": "Table 4:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 349.6,
"r_y0": 665.8,
"r_x1": 545.1,
"r_y1": 665.8,
"r_x2": 545.1,
"r_y2": 656.9,
"r_x3": 349.6,
"r_y3": 656.9,
"coord_origin": "TOPLEFT"
},
"text": "Results of structure with content retrieved using",
"orig": "Results of structure with content retrieved using",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 677.7,
"r_x1": 545.1,
"r_y1": 677.7,
"r_x2": 545.1,
"r_y2": 668.8,
"r_x3": 308.9,
"r_y3": 668.8,
"coord_origin": "TOPLEFT"
},
"text": "cell detection on PubTabNet. In all cases the input is PDF",
"orig": "cell detection on PubTabNet. In all cases the input is PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 689.7,
"r_x1": 435.0,
"r_y1": 689.7,
"r_x2": 435.0,
"r_y2": 680.8,
"r_x3": 308.9,
"r_y3": 680.8,
"coord_origin": "TOPLEFT"
},
"text": "documents with cropped tables.",
"orig": "documents with cropped tables.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 6,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7"
}
]
}
},
{
"page_no": 7,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 216.1,
"r_x1": 62.2,
"r_y1": 216.1,
"r_x2": 62.2,
"r_y2": 208.2,
"r_x3": 53.8,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 216.1,
"r_x1": 385.9,
"r_y1": 216.1,
"r_x2": 385.9,
"r_y2": 208.2,
"r_x3": 66.4,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 102.2,
"r_x1": 284.3,
"r_y1": 102.2,
"r_x2": 284.3,
"r_y2": 94.3,
"r_x3": 53.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.8,
"r_y0": 102.2,
"r_x1": 431.1,
"r_y1": 102.2,
"r_x2": 431.1,
"r_y2": 94.3,
"r_x3": 304.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 86.6,
"r_x1": 61.6,
"r_y1": 86.6,
"r_x2": 61.6,
"r_y2": 78.7,
"r_x3": 53.3,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.7,
"r_y0": 86.6,
"r_x1": 499.6,
"r_y1": 86.6,
"r_x2": 499.6,
"r_y2": 78.7,
"r_x3": 65.7,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.4,
"r_y0": 298.6,
"r_x1": 549.4,
"r_y1": 298.6,
"r_x2": 549.4,
"r_y2": 292.3,
"r_x3": 380.4,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 329.8,
"r_x1": 86.9,
"r_y1": 329.8,
"r_x2": 86.9,
"r_y2": 320.9,
"r_x3": 50.1,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.9,
"r_y0": 329.8,
"r_x1": 545.1,
"r_y1": 329.8,
"r_x2": 545.1,
"r_y2": 320.9,
"r_x3": 93.9,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 341.7,
"r_x1": 545.1,
"r_y1": 341.7,
"r_x2": 545.1,
"r_y2": 332.8,
"r_x3": 50.1,
"r_y3": 332.8,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 353.7,
"r_x1": 545.1,
"r_y1": 353.7,
"r_x2": 545.1,
"r_y2": 344.8,
"r_x3": 50.1,
"r_y3": 344.8,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.6,
"r_x1": 139.8,
"r_y1": 365.6,
"r_x2": 139.8,
"r_y2": 356.7,
"r_x3": 50.1,
"r_y3": 356.7,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.6,
"r_x1": 532.6,
"r_y1": 467.6,
"r_x2": 532.6,
"r_y2": 458.7,
"r_x3": 62.6,
"r_y3": 458.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.2,
"r_x1": 64.4,
"r_y1": 501.2,
"r_x2": 64.4,
"r_y2": 491.4,
"r_x3": 50.1,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.0,
"r_y0": 501.2,
"r_x1": 163.8,
"r_y1": 501.2,
"r_x2": 163.8,
"r_y2": 491.4,
"r_x3": 74.0,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 545.8,
"r_x1": 286.4,
"r_y1": 545.8,
"r_x2": 286.4,
"r_y2": 536.9,
"r_x3": 62.1,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 557.7,
"r_x1": 211.2,
"r_y1": 557.7,
"r_x2": 211.2,
"r_y2": 548.8,
"r_x3": 50.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.5,
"r_x1": 259.2,
"r_y1": 557.5,
"r_x2": 259.2,
"r_y2": 548.9,
"r_x3": 215.1,
"r_y3": 548.9,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.1,
"r_y0": 557.7,
"r_x1": 286.4,
"r_y1": 557.7,
"r_x2": 286.4,
"r_y2": 548.8,
"r_x3": 263.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 50.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 226.9,
"r_y1": 713.2,
"r_x2": 226.9,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 501.5,
"r_x1": 316.1,
"r_y1": 501.5,
"r_x2": 316.1,
"r_y2": 490.7,
"r_x3": 308.9,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.7,
"r_y0": 501.5,
"r_x1": 460.8,
"r_y1": 501.5,
"r_x2": 460.8,
"r_y2": 490.7,
"r_x3": 325.7,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 521.8,
"r_x1": 545.1,
"r_y1": 521.8,
"r_x2": 545.1,
"r_y2": 512.9,
"r_x3": 320.8,
"r_y3": 512.9,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.8,
"r_x3": 308.9,
"r_y3": 524.8,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.7,
"r_x1": 545.1,
"r_y1": 545.7,
"r_x2": 545.1,
"r_y2": 536.8,
"r_x3": 308.9,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.6,
"r_x1": 545.1,
"r_y1": 569.6,
"r_x2": 545.1,
"r_y2": 560.7,
"r_x3": 308.9,
"r_y3": 560.7,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.5,
"r_x1": 545.1,
"r_y1": 593.5,
"r_x2": 545.1,
"r_y2": 584.6,
"r_x3": 308.9,
"r_y3": 584.6,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.5,
"r_x1": 400.5,
"r_y1": 605.5,
"r_x2": 400.5,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.4,
"r_y0": 605.5,
"r_x1": 545.1,
"r_y1": 605.5,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 408.4,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.4,
"r_x1": 545.1,
"r_y1": 617.4,
"r_x2": 545.1,
"r_y2": 608.5,
"r_x3": 308.9,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.4,
"r_x1": 545.1,
"r_y1": 629.4,
"r_x2": 545.1,
"r_y2": 620.5,
"r_x3": 308.9,
"r_y3": 620.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.4,
"r_x3": 308.9,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.3,
"r_x1": 365.9,
"r_y1": 653.3,
"r_x2": 365.9,
"r_y2": 644.4,
"r_x3": 308.9,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 682.8,
"r_x1": 364.4,
"r_y1": 682.8,
"r_x2": 364.4,
"r_y2": 672.1,
"r_x3": 308.9,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.3,
"r_y0": 702.0,
"r_x1": 323.8,
"r_y1": 702.0,
"r_x2": 323.8,
"r_y2": 694.0,
"r_x3": 313.3,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 326.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 545.1,
"r_y1": 712.9,
"r_x2": 545.1,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 18,
"label": "caption",
"bbox": {
"l": 53.8,
"t": 208.2,
"r": 385.9,
"b": 216.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 216.1,
"r_x1": 62.2,
"r_y1": 216.1,
"r_x2": 62.2,
"r_y2": 208.2,
"r_x3": 53.8,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 216.1,
"r_x1": 385.9,
"r_y1": 216.1,
"r_x2": 385.9,
"r_y2": 208.2,
"r_x3": 66.4,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.8,
"t": 94.3,
"r": 284.3,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 102.2,
"r_x1": 284.3,
"r_y1": 102.2,
"r_x2": 284.3,
"r_y2": 94.3,
"r_x3": 53.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.8,
"t": 94.3,
"r": 431.1,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.8,
"r_y0": 102.2,
"r_x1": 431.1,
"r_y1": 102.2,
"r_x2": 431.1,
"r_y2": 94.3,
"r_x3": 304.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.3,
"t": 78.7,
"r": 61.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.58,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 86.6,
"r_x1": 61.6,
"r_y1": 86.6,
"r_x2": 61.6,
"r_y2": 78.7,
"r_x3": 53.3,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.7,
"t": 78.7,
"r": 499.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.54,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.7,
"r_y0": 86.6,
"r_x1": 499.6,
"r_y1": 86.6,
"r_x2": 499.6,
"r_y2": 78.7,
"r_x3": 65.7,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 53.6,
"t": 218.9,
"r": 298.6,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.1,
"t": 229.7,
"r": 201.3,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.6,
"r": 103.0,
"b": 253.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.0,
"t": 249.8,
"r": 129.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.1,
"t": 257.1,
"r": 93.2,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.2,
"t": 257.3,
"r": 119.1,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.5,
"t": 257.1,
"r": 129.9,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.2,
"t": 264.3,
"r": 65.3,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.3,
"t": 264.5,
"r": 122.4,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.5,
"t": 264.3,
"r": 129.9,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 102.0,
"t": 271.5,
"r": 109.7,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.7,
"t": 271.7,
"r": 114.9,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.4,
"t": 271.5,
"r": 122.1,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.1,
"t": 271.7,
"r": 127.3,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.7,
"t": 279.2,
"r": 110.2,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 16,
"label": "caption",
"bbox": {
"l": 380.4,
"t": 292.3,
"r": 549.4,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.4,
"r_y0": 298.6,
"r_x1": 549.4,
"r_y1": 298.6,
"r_x2": 549.4,
"r_y2": 292.3,
"r_x3": 380.4,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "table",
"bbox": {
"l": 304.9,
"t": 218.5,
"r": 550.2,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.8,
"t": 227.8,
"r": 507.2,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.7,
"t": 236.7,
"r": 404.6,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.6,
"t": 236.7,
"r": 407.3,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.7,
"t": 244.6,
"r": 364.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.8,
"t": 244.9,
"r": 403.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 481.0,
"t": 244.9,
"r": 483.6,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.8,
"t": 253.7,
"r": 403.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.7,
"t": 261.5,
"r": 403.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.7,
"t": 261.5,
"r": 405.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.7,
"t": 270.3,
"r": 403.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.7,
"t": 270.3,
"r": 405.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 6,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 320.9,
"r": 545.1,
"b": 365.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 329.8,
"r_x1": 86.9,
"r_y1": 329.8,
"r_x2": 86.9,
"r_y2": 320.9,
"r_x3": 50.1,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.9,
"r_y0": 329.8,
"r_x1": 545.1,
"r_y1": 329.8,
"r_x2": 545.1,
"r_y2": 320.9,
"r_x3": 93.9,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 341.7,
"r_x1": 545.1,
"r_y1": 341.7,
"r_x2": 545.1,
"r_y2": 332.8,
"r_x3": 50.1,
"r_y3": 332.8,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 353.7,
"r_x1": 545.1,
"r_y1": 353.7,
"r_x2": 545.1,
"r_y2": 344.8,
"r_x3": 50.1,
"r_y3": 344.8,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.6,
"r_x1": 139.8,
"r_y1": 365.6,
"r_x2": 139.8,
"r_y2": 356.7,
"r_x3": 50.1,
"r_y3": 356.7,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "picture",
"bbox": {
"l": 216.8,
"t": 380.5,
"r": 375.8,
"b": 443.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.3,
"t": 381.8,
"r": 342.1,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 11,
"label": "picture",
"bbox": {
"l": 51.7,
"t": 380.5,
"r": 211.8,
"b": 443.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.7,
"t": 381.8,
"r": 85.7,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 13,
"label": "picture",
"bbox": {
"l": 383.1,
"t": 381.2,
"r": 542.1,
"b": 442.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.4,
"t": 400.6,
"r": 443.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.3,
"t": 400.6,
"r": 456.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.3,
"t": 400.6,
"r": 469.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.2,
"t": 400.6,
"r": 482.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.2,
"t": 400.6,
"r": 495.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.1,
"t": 400.6,
"r": 508.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.6,
"r": 521.4,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.3,
"t": 411.0,
"r": 391.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.5,
"t": 411.0,
"r": 404.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.5,
"t": 411.0,
"r": 417.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.4,
"t": 411.0,
"r": 443.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.3,
"t": 411.0,
"r": 456.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.3,
"t": 411.0,
"r": 469.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.3,
"t": 421.1,
"r": 391.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.5,
"t": 421.1,
"r": 404.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.5,
"t": 421.1,
"r": 417.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.4,
"t": 421.1,
"r": 430.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.4,
"t": 421.1,
"r": 443.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.3,
"t": 421.1,
"r": 456.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.3,
"t": 421.1,
"r": 469.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.2,
"t": 421.1,
"r": 482.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.2,
"t": 421.1,
"r": 495.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.1,
"t": 421.1,
"r": 508.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.1,
"r": 521.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.0,
"t": 421.1,
"r": 534.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.3,
"t": 432.0,
"r": 391.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.5,
"t": 432.0,
"r": 404.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.5,
"t": 432.0,
"r": 417.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.4,
"t": 432.0,
"r": 430.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.4,
"t": 432.0,
"r": 443.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.3,
"t": 432.0,
"r": 456.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.3,
"t": 432.0,
"r": 469.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.2,
"t": 432.0,
"r": 482.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.2,
"t": 432.0,
"r": 495.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.1,
"t": 432.0,
"r": 508.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.0,
"r": 521.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.0,
"t": 432.0,
"r": 534.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.3,
"t": 389.2,
"r": 388.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.5,
"t": 389.2,
"r": 401.7,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.5,
"t": 389.2,
"r": 414.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.4,
"t": 389.2,
"r": 427.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.4,
"t": 389.2,
"r": 440.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.3,
"t": 389.2,
"r": 453.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.3,
"t": 389.2,
"r": 466.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.2,
"t": 389.2,
"r": 479.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.2,
"t": 389.2,
"r": 492.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.1,
"t": 389.2,
"r": 505.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.1,
"t": 389.2,
"r": 521.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.0,
"t": 389.2,
"r": 534.1,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.3,
"t": 399.0,
"r": 391.6,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.5,
"t": 399.0,
"r": 404.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.5,
"t": 399.0,
"r": 417.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.4,
"t": 406.8,
"r": 430.7,
"b": 413.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.9,
"t": 411.0,
"r": 509.2,
"b": 417.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.4,
"t": 381.8,
"r": 431.0,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.7,
"r": 532.6,
"b": 467.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.6,
"r_x1": 532.6,
"r_y1": 467.6,
"r_x2": 532.6,
"r_y2": 458.7,
"r_x3": 62.6,
"r_y3": 458.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 491.4,
"r": 163.8,
"b": 501.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.2,
"r_x1": 64.4,
"r_y1": 501.2,
"r_x2": 64.4,
"r_y2": 491.4,
"r_x3": 50.1,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.0,
"r_y0": 501.2,
"r_x1": 163.8,
"r_y1": 501.2,
"r_x2": 163.8,
"r_y2": 491.4,
"r_x3": 74.0,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 536.9,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 545.8,
"r_x1": 286.4,
"r_y1": 545.8,
"r_x2": 286.4,
"r_y2": 536.9,
"r_x3": 62.1,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 557.7,
"r_x1": 211.2,
"r_y1": 557.7,
"r_x2": 211.2,
"r_y2": 548.8,
"r_x3": 50.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.5,
"r_x1": 259.2,
"r_y1": 557.5,
"r_x2": 259.2,
"r_y2": 548.9,
"r_x3": 215.1,
"r_y3": 548.9,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.1,
"r_y0": 557.7,
"r_x1": 286.4,
"r_y1": 557.7,
"r_x2": 286.4,
"r_y2": 548.8,
"r_x3": 263.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 50.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 226.9,
"r_y1": 713.2,
"r_x2": 226.9,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 490.7,
"r": 460.8,
"b": 501.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 501.5,
"r_x1": 316.1,
"r_y1": 501.5,
"r_x2": 316.1,
"r_y2": 490.7,
"r_x3": 308.9,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.7,
"r_y0": 501.5,
"r_x1": 460.8,
"r_y1": 501.5,
"r_x2": 460.8,
"r_y2": 490.7,
"r_x3": 325.7,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 512.9,
"r": 545.1,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 521.8,
"r_x1": 545.1,
"r_y1": 521.8,
"r_x2": 545.1,
"r_y2": 512.9,
"r_x3": 320.8,
"r_y3": 512.9,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.8,
"r_x3": 308.9,
"r_y3": 524.8,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.7,
"r_x1": 545.1,
"r_y1": 545.7,
"r_x2": 545.1,
"r_y2": 536.8,
"r_x3": 308.9,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.6,
"r_x1": 545.1,
"r_y1": 569.6,
"r_x2": 545.1,
"r_y2": 560.7,
"r_x3": 308.9,
"r_y3": 560.7,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.5,
"r_x1": 545.1,
"r_y1": 593.5,
"r_x2": 545.1,
"r_y2": 584.6,
"r_x3": 308.9,
"r_y3": 584.6,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.5,
"r_x1": 400.5,
"r_y1": 605.5,
"r_x2": 400.5,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.4,
"r_y0": 605.5,
"r_x1": 545.1,
"r_y1": 605.5,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 408.4,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.4,
"r_x1": 545.1,
"r_y1": 617.4,
"r_x2": 545.1,
"r_y2": 608.5,
"r_x3": 308.9,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.4,
"r_x1": 545.1,
"r_y1": 629.4,
"r_x2": 545.1,
"r_y2": 620.5,
"r_x3": 308.9,
"r_y3": 620.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.4,
"r_x3": 308.9,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.3,
"r_x1": 365.9,
"r_y1": 653.3,
"r_x2": 365.9,
"r_y2": 644.4,
"r_x3": 308.9,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 672.1,
"r": 364.4,
"b": 682.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 682.8,
"r_x1": 364.4,
"r_y1": 682.8,
"r_x2": 364.4,
"r_y2": 672.1,
"r_x3": 308.9,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.3,
"t": 694.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.3,
"r_y0": 702.0,
"r_x1": 323.8,
"r_y1": 702.0,
"r_x2": 323.8,
"r_y2": 694.0,
"r_x3": 313.3,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 326.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 545.1,
"r_y1": 712.9,
"r_x2": 545.1,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "picture",
"bbox": {
"l": 305.6,
"t": 98.7,
"r": 554.8,
"b": 180.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
{
"id": 14,
"label": "picture",
"bbox": {
"l": 50.0,
"t": 103.7,
"r": 301.6,
"b": 187.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"8": {
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.6,
"t": 218.9,
"r": 298.6,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.1,
"t": 229.7,
"r": 201.3,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.6,
"r": 103.0,
"b": 253.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.0,
"t": 249.8,
"r": 129.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.1,
"t": 257.1,
"r": 93.2,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.2,
"t": 257.3,
"r": 119.1,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.5,
"t": 257.1,
"r": 129.9,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.2,
"t": 264.3,
"r": 65.3,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.3,
"t": 264.5,
"r": 122.4,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.5,
"t": 264.3,
"r": 129.9,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 102.0,
"t": 271.5,
"r": 109.7,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.7,
"t": 271.7,
"r": 114.9,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.4,
"t": 271.5,
"r": 122.1,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.1,
"t": 271.7,
"r": 127.3,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.7,
"t": 279.2,
"r": 110.2,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
"7": {
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.9,
"t": 218.5,
"r": 550.2,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.8,
"t": 227.8,
"r": 507.2,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.7,
"t": 236.7,
"r": 404.6,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.6,
"t": 236.7,
"r": 407.3,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.7,
"t": 244.6,
"r": 364.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.8,
"t": 244.9,
"r": 403.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 481.0,
"t": 244.9,
"r": 483.6,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.8,
"t": 253.7,
"r": 403.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.7,
"t": 261.5,
"r": 403.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.7,
"t": 261.5,
"r": 405.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.7,
"t": 270.3,
"r": 403.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.7,
"t": 270.3,
"r": 405.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 18,
"page_no": 7,
"cluster": {
"id": 18,
"label": "caption",
"bbox": {
"l": 53.8,
"t": 208.2,
"r": 385.9,
"b": 216.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 216.1,
"r_x1": 62.2,
"r_y1": 216.1,
"r_x2": 62.2,
"r_y2": 208.2,
"r_x3": 53.8,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 216.1,
"r_x1": 385.9,
"r_y1": 216.1,
"r_x2": 385.9,
"r_y2": 208.2,
"r_x3": 66.4,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"
},
{
"label": "section_header",
"id": 29,
"page_no": 7,
"cluster": {
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.8,
"t": 94.3,
"r": 284.3,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 102.2,
"r_x1": 284.3,
"r_y1": 102.2,
"r_x2": 284.3,
"r_y2": 94.3,
"r_x3": 53.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Japanese language (previously unseen by TableFormer):"
},
{
"label": "section_header",
"id": 31,
"page_no": 7,
"cluster": {
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.8,
"t": 94.3,
"r": 431.1,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.8,
"r_y0": 102.2,
"r_x1": 431.1,
"r_y1": 102.2,
"r_x2": 431.1,
"r_y2": 94.3,
"r_x3": 304.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Example table from FinTabNet:"
},
{
"label": "list_item",
"id": 20,
"page_no": 7,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.3,
"t": 78.7,
"r": 61.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.58,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 86.6,
"r_x1": 61.6,
"r_y1": 86.6,
"r_x2": 61.6,
"r_y2": 78.7,
"r_x3": 53.3,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a."
},
{
"label": "list_item",
"id": 21,
"page_no": 7,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.7,
"t": 78.7,
"r": 499.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.54,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.7,
"r_y0": 86.6,
"r_x1": 499.6,
"r_y1": 86.6,
"r_x2": 499.6,
"r_y2": 78.7,
"r_x3": 65.7,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"
},
{
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.6,
"t": 218.9,
"r": 298.6,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.1,
"t": 229.7,
"r": 201.3,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.6,
"r": 103.0,
"b": 253.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.0,
"t": 249.8,
"r": 129.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.1,
"t": 257.1,
"r": 93.2,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.2,
"t": 257.3,
"r": 119.1,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.5,
"t": 257.1,
"r": 129.9,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.2,
"t": 264.3,
"r": 65.3,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.3,
"t": 264.5,
"r": 122.4,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.5,
"t": 264.3,
"r": 129.9,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 102.0,
"t": 271.5,
"r": 109.7,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.7,
"t": 271.7,
"r": 114.9,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.4,
"t": 271.5,
"r": 122.1,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.1,
"t": 271.7,
"r": 127.3,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.7,
"t": 279.2,
"r": 110.2,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 16,
"page_no": 7,
"cluster": {
"id": 16,
"label": "caption",
"bbox": {
"l": 380.4,
"t": 292.3,
"r": 549.4,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.4,
"r_y0": 298.6,
"r_x1": 549.4,
"r_y1": 298.6,
"r_x2": 549.4,
"r_y2": 292.3,
"r_x3": 380.4,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Text is aligned to match original for ease of viewing"
},
{
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.9,
"t": 218.5,
"r": 550.2,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.8,
"t": 227.8,
"r": 507.2,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.7,
"t": 236.7,
"r": 404.6,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.6,
"t": 236.7,
"r": 407.3,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.7,
"t": 244.6,
"r": 364.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.8,
"t": 244.9,
"r": 403.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 481.0,
"t": 244.9,
"r": 483.6,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.8,
"t": 253.7,
"r": 403.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.7,
"t": 261.5,
"r": 403.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.7,
"t": 261.5,
"r": 405.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.7,
"t": 270.3,
"r": 403.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.7,
"t": 270.3,
"r": 405.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 7,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 320.9,
"r": 545.1,
"b": 365.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 329.8,
"r_x1": 86.9,
"r_y1": 329.8,
"r_x2": 86.9,
"r_y2": 320.9,
"r_x3": 50.1,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.9,
"r_y0": 329.8,
"r_x1": 545.1,
"r_y1": 329.8,
"r_x2": 545.1,
"r_y2": 320.9,
"r_x3": 93.9,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 341.7,
"r_x1": 545.1,
"r_y1": 341.7,
"r_x2": 545.1,
"r_y2": 332.8,
"r_x3": 50.1,
"r_y3": 332.8,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 353.7,
"r_x1": 545.1,
"r_y1": 353.7,
"r_x2": 545.1,
"r_y2": 344.8,
"r_x3": 50.1,
"r_y3": 344.8,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.6,
"r_x1": 139.8,
"r_y1": 365.6,
"r_x2": 139.8,
"r_y2": 356.7,
"r_x3": 50.1,
"r_y3": 356.7,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."
},
{
"label": "picture",
"id": 12,
"page_no": 7,
"cluster": {
"id": 12,
"label": "picture",
"bbox": {
"l": 216.8,
"t": 380.5,
"r": 375.8,
"b": 443.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.3,
"t": 381.8,
"r": 342.1,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 11,
"page_no": 7,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 51.7,
"t": 380.5,
"r": 211.8,
"b": 443.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.7,
"t": 381.8,
"r": 85.7,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 13,
"page_no": 7,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 383.1,
"t": 381.2,
"r": 542.1,
"b": 442.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.4,
"t": 400.6,
"r": 443.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.3,
"t": 400.6,
"r": 456.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.3,
"t": 400.6,
"r": 469.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.2,
"t": 400.6,
"r": 482.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.2,
"t": 400.6,
"r": 495.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.1,
"t": 400.6,
"r": 508.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.6,
"r": 521.4,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.3,
"t": 411.0,
"r": 391.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.5,
"t": 411.0,
"r": 404.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.5,
"t": 411.0,
"r": 417.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.4,
"t": 411.0,
"r": 443.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.3,
"t": 411.0,
"r": 456.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.3,
"t": 411.0,
"r": 469.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.3,
"t": 421.1,
"r": 391.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.5,
"t": 421.1,
"r": 404.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.5,
"t": 421.1,
"r": 417.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.4,
"t": 421.1,
"r": 430.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.4,
"t": 421.1,
"r": 443.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.3,
"t": 421.1,
"r": 456.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.3,
"t": 421.1,
"r": 469.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.2,
"t": 421.1,
"r": 482.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.2,
"t": 421.1,
"r": 495.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.1,
"t": 421.1,
"r": 508.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.1,
"r": 521.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.0,
"t": 421.1,
"r": 534.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.3,
"t": 432.0,
"r": 391.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.5,
"t": 432.0,
"r": 404.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.5,
"t": 432.0,
"r": 417.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.4,
"t": 432.0,
"r": 430.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.4,
"t": 432.0,
"r": 443.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.3,
"t": 432.0,
"r": 456.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.3,
"t": 432.0,
"r": 469.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.2,
"t": 432.0,
"r": 482.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.2,
"t": 432.0,
"r": 495.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.1,
"t": 432.0,
"r": 508.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.0,
"r": 521.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.0,
"t": 432.0,
"r": 534.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.3,
"t": 389.2,
"r": 388.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.5,
"t": 389.2,
"r": 401.7,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.5,
"t": 389.2,
"r": 414.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.4,
"t": 389.2,
"r": 427.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.4,
"t": 389.2,
"r": 440.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.3,
"t": 389.2,
"r": 453.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.3,
"t": 389.2,
"r": 466.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.2,
"t": 389.2,
"r": 479.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.2,
"t": 389.2,
"r": 492.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.1,
"t": 389.2,
"r": 505.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.1,
"t": 389.2,
"r": 521.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.0,
"t": 389.2,
"r": 534.1,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.3,
"t": 399.0,
"r": 391.6,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.5,
"t": 399.0,
"r": 404.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.5,
"t": 399.0,
"r": 417.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.4,
"t": 406.8,
"r": 430.7,
"b": 413.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.9,
"t": 411.0,
"r": 509.2,
"b": 417.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.4,
"t": 381.8,
"r": 431.0,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 5,
"page_no": 7,
"cluster": {
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.7,
"r": 532.6,
"b": 467.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.6,
"r_x1": 532.6,
"r_y1": 467.6,
"r_x2": 532.6,
"r_y2": 458.7,
"r_x3": 62.6,
"r_y3": 458.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."
},
{
"label": "section_header",
"id": 2,
"page_no": 7,
"cluster": {
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 491.4,
"r": 163.8,
"b": 501.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.2,
"r_x1": 64.4,
"r_y1": 501.2,
"r_x2": 64.4,
"r_y2": 491.4,
"r_x3": 50.1,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.0,
"r_y0": 501.2,
"r_x1": 163.8,
"r_y1": 501.2,
"r_x2": 163.8,
"r_y2": 491.4,
"r_x3": 74.0,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.5. Qualitative Analysis"
},
{
"label": "text",
"id": 1,
"page_no": 7,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 536.9,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 545.8,
"r_x1": 286.4,
"r_y1": 545.8,
"r_x2": 286.4,
"r_y2": 536.9,
"r_x3": 62.1,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 557.7,
"r_x1": 211.2,
"r_y1": 557.7,
"r_x2": 211.2,
"r_y2": 548.8,
"r_x3": 50.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.5,
"r_x1": 259.2,
"r_y1": 557.5,
"r_x2": 259.2,
"r_y2": 548.9,
"r_x3": 215.1,
"r_y3": 548.9,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.1,
"r_y0": 557.7,
"r_x1": 286.4,
"r_y1": 557.7,
"r_x2": 286.4,
"r_y2": 548.8,
"r_x3": 263.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 50.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 226.9,
"r_y1": 713.2,
"r_x2": 226.9,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."
},
{
"label": "section_header",
"id": 4,
"page_no": 7,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 490.7,
"r": 460.8,
"b": 501.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 501.5,
"r_x1": 316.1,
"r_y1": 501.5,
"r_x2": 316.1,
"r_y2": 490.7,
"r_x3": 308.9,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.7,
"r_y0": 501.5,
"r_x1": 460.8,
"r_y1": 501.5,
"r_x2": 460.8,
"r_y2": 490.7,
"r_x3": 325.7,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Future Work & Conclusion"
},
{
"label": "text",
"id": 0,
"page_no": 7,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 512.9,
"r": 545.1,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 521.8,
"r_x1": 545.1,
"r_y1": 521.8,
"r_x2": 545.1,
"r_y2": 512.9,
"r_x3": 320.8,
"r_y3": 512.9,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.8,
"r_x3": 308.9,
"r_y3": 524.8,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.7,
"r_x1": 545.1,
"r_y1": 545.7,
"r_x2": 545.1,
"r_y2": 536.8,
"r_x3": 308.9,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.6,
"r_x1": 545.1,
"r_y1": 569.6,
"r_x2": 545.1,
"r_y2": 560.7,
"r_x3": 308.9,
"r_y3": 560.7,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.5,
"r_x1": 545.1,
"r_y1": 593.5,
"r_x2": 545.1,
"r_y2": 584.6,
"r_x3": 308.9,
"r_y3": 584.6,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.5,
"r_x1": 400.5,
"r_y1": 605.5,
"r_x2": 400.5,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.4,
"r_y0": 605.5,
"r_x1": 545.1,
"r_y1": 605.5,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 408.4,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.4,
"r_x1": 545.1,
"r_y1": 617.4,
"r_x2": 545.1,
"r_y2": 608.5,
"r_x3": 308.9,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.4,
"r_x1": 545.1,
"r_y1": 629.4,
"r_x2": 545.1,
"r_y2": 620.5,
"r_x3": 308.9,
"r_y3": 620.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.4,
"r_x3": 308.9,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.3,
"r_x1": 365.9,
"r_y1": 653.3,
"r_x2": 365.9,
"r_y2": 644.4,
"r_x3": 308.9,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."
},
{
"label": "section_header",
"id": 3,
"page_no": 7,
"cluster": {
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 672.1,
"r": 364.4,
"b": 682.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 682.8,
"r_x1": 364.4,
"r_y1": 682.8,
"r_x2": 364.4,
"r_y2": 672.1,
"r_x3": 308.9,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "References"
},
{
"label": "list_item",
"id": 10,
"page_no": 7,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.3,
"t": 694.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.3,
"r_y0": 702.0,
"r_x1": 323.8,
"r_y1": 702.0,
"r_x2": 323.8,
"r_y2": 694.0,
"r_x3": 313.3,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 326.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 545.1,
"r_y1": 712.9,
"r_x2": 545.1,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"
},
{
"label": "page_footer",
"id": 9,
"page_no": 7,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8"
},
{
"label": "picture",
"id": 15,
"page_no": 7,
"cluster": {
"id": 15,
"label": "picture",
"bbox": {
"l": 305.6,
"t": 98.7,
"r": 554.8,
"b": 180.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 14,
"page_no": 7,
"cluster": {
"id": 14,
"label": "picture",
"bbox": {
"l": 50.0,
"t": 103.7,
"r": 301.6,
"b": 187.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 18,
"page_no": 7,
"cluster": {
"id": 18,
"label": "caption",
"bbox": {
"l": 53.8,
"t": 208.2,
"r": 385.9,
"b": 216.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 216.1,
"r_x1": 62.2,
"r_y1": 216.1,
"r_x2": 62.2,
"r_y2": 208.2,
"r_x3": 53.8,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 216.1,
"r_x1": 385.9,
"r_y1": 216.1,
"r_x2": 385.9,
"r_y2": 208.2,
"r_x3": 66.4,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"orig": "Structure predicted by TableFormer, with superimposed matched PDF cell text:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"
},
{
"label": "section_header",
"id": 29,
"page_no": 7,
"cluster": {
"id": 29,
"label": "section_header",
"bbox": {
"l": 53.8,
"t": 94.3,
"r": 284.3,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.8,
"r_y0": 102.2,
"r_x1": 284.3,
"r_y1": 102.2,
"r_x2": 284.3,
"r_y2": 94.3,
"r_x3": 53.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Japanese language (previously unseen by TableFormer):",
"orig": "Japanese language (previously unseen by TableFormer):",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Japanese language (previously unseen by TableFormer):"
},
{
"label": "section_header",
"id": 31,
"page_no": 7,
"cluster": {
"id": 31,
"label": "section_header",
"bbox": {
"l": 304.8,
"t": 94.3,
"r": 431.1,
"b": 102.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.46,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 304.8,
"r_y0": 102.2,
"r_x1": 431.1,
"r_y1": 102.2,
"r_x2": 431.1,
"r_y2": 94.3,
"r_x3": 304.8,
"r_y3": 94.3,
"coord_origin": "TOPLEFT"
},
"text": "Example table from FinTabNet:",
"orig": "Example table from FinTabNet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Example table from FinTabNet:"
},
{
"label": "list_item",
"id": 20,
"page_no": 7,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 53.3,
"t": 78.7,
"r": 61.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.58,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 86.6,
"r_x1": 61.6,
"r_y1": 86.6,
"r_x2": 61.6,
"r_y2": 78.7,
"r_x3": 53.3,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "a.",
"orig": "a.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "a."
},
{
"label": "list_item",
"id": 21,
"page_no": 7,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 65.7,
"t": 78.7,
"r": 499.6,
"b": 86.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.54,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.7,
"r_y0": 86.6,
"r_x1": 499.6,
"r_y1": 86.6,
"r_x2": 499.6,
"r_y2": 78.7,
"r_x3": 65.7,
"r_y3": 78.7,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"orig": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"
},
{
"label": "table",
"id": 8,
"page_no": 7,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 53.6,
"t": 218.9,
"r": 298.6,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 55,
"label": "text",
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.9,
"r_y0": 226.4,
"r_x1": 241.0,
"r_y1": 226.4,
"r_x2": 241.0,
"r_y2": 222.2,
"r_x3": 209.9,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.8,
"r_y0": 226.4,
"r_x1": 284.5,
"r_y1": 226.4,
"r_x2": 284.5,
"r_y2": 222.2,
"r_x3": 263.8,
"r_y3": 222.2,
"coord_origin": "TOPLEFT"
},
"text": "\u53c2\u8003\u6587\u732e",
"orig": "\u53c2\u8003\u6587\u732e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.2,
"r_y0": 233.8,
"r_x1": 120.6,
"r_y1": 233.8,
"r_x2": 120.6,
"r_y2": 229.7,
"r_x3": 110.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u51fa\u5178",
"orig": "\u51fa\u5178",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 175.4,
"r_y0": 233.8,
"r_x1": 196.1,
"r_y1": 233.8,
"r_x2": 196.1,
"r_y2": 229.7,
"r_x3": 175.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u30d5\u30a1\u30a4\u30eb",
"orig": "\u30d5\u30a1\u30a4\u30eb",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 196.1,
"t": 229.7,
"r": 201.3,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 196.1,
"r_y0": 233.8,
"r_x1": 201.3,
"r_y1": 233.8,
"r_x2": 201.3,
"r_y2": 229.7,
"r_x3": 196.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u6570",
"orig": "\u6570",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.6,
"r_y0": 233.8,
"r_x1": 220.0,
"r_y1": 233.8,
"r_x2": 220.0,
"r_y2": 229.7,
"r_x3": 209.6,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 229.2,
"r_y0": 233.8,
"r_x1": 244.8,
"r_y1": 233.8,
"r_x2": 244.8,
"r_y2": 229.7,
"r_x3": 229.2,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.1,
"r_y0": 233.8,
"r_x1": 266.5,
"r_y1": 233.8,
"r_x2": 266.5,
"r_y2": 229.7,
"r_x3": 256.1,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u82f1\u8a9e",
"orig": "\u82f1\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.4,
"r_y0": 233.8,
"r_x1": 293.9,
"r_y1": 233.8,
"r_x2": 293.9,
"r_y2": 229.7,
"r_x3": 278.4,
"r_y3": 229.7,
"coord_origin": "TOPLEFT"
},
"text": "\u65e5\u672c\u8a9e",
"orig": "\u65e5\u672c\u8a9e",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 240.8,
"r_x1": 162.7,
"r_y1": 240.8,
"r_x2": 162.7,
"r_y2": 236.4,
"r_x3": 55.5,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "Association for Computational Linguistics(ACL2003)",
"orig": "Association for Computational Linguistics(ACL2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 240.8,
"r_x1": 189.6,
"r_y1": 240.8,
"r_x2": 189.6,
"r_y2": 236.4,
"r_x3": 184.4,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 240.8,
"r_x1": 214.2,
"r_y1": 240.8,
"r_x2": 214.2,
"r_y2": 236.4,
"r_x3": 209.0,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 240.8,
"r_x1": 237.5,
"r_y1": 240.8,
"r_x2": 237.5,
"r_y2": 236.4,
"r_x3": 234.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 240.8,
"r_x1": 264.6,
"r_y1": 240.8,
"r_x2": 264.6,
"r_y2": 236.4,
"r_x3": 256.9,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 240.8,
"r_x1": 286.6,
"r_y1": 240.8,
"r_x2": 286.6,
"r_y2": 236.4,
"r_x3": 284.1,
"r_y3": 236.4,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 247.0,
"r_x1": 139.7,
"r_y1": 247.0,
"r_x2": 139.7,
"r_y2": 242.6,
"r_x3": 55.5,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "Computational Linguistics(COLING2002)",
"orig": "Computational Linguistics(COLING2002)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 247.0,
"r_x1": 190.9,
"r_y1": 247.0,
"r_x2": 190.9,
"r_y2": 242.6,
"r_x3": 183.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 247.0,
"r_x1": 215.4,
"r_y1": 247.0,
"r_x2": 215.4,
"r_y2": 242.6,
"r_x3": 207.7,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "140",
"orig": "140",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 234.9,
"r_y0": 247.0,
"r_x1": 237.5,
"r_y1": 247.0,
"r_x2": 237.5,
"r_y2": 242.6,
"r_x3": 234.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 247.0,
"r_x1": 264.6,
"r_y1": 247.0,
"r_x2": 264.6,
"r_y2": 242.6,
"r_x3": 256.9,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 284.1,
"r_y0": 247.0,
"r_x1": 286.6,
"r_y1": 247.0,
"r_x2": 286.6,
"r_y2": 242.6,
"r_x3": 284.1,
"r_y3": 242.6,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 254.0,
"r_x1": 97.0,
"r_y1": 254.0,
"r_x2": 97.0,
"r_y2": 249.8,
"r_x3": 55.5,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 92.7,
"t": 249.6,
"r": 103.0,
"b": 253.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 92.7,
"r_y0": 253.9,
"r_x1": 103.0,
"r_y1": 253.9,
"r_x2": 103.0,
"r_y2": 249.6,
"r_x3": 92.7,
"r_y3": 249.6,
"coord_origin": "TOPLEFT"
},
"text": "2003",
"orig": "2003",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 103.0,
"t": 249.8,
"r": 129.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.0,
"r_y0": 254.0,
"r_x1": 129.0,
"r_y1": 254.0,
"r_x2": 129.0,
"r_y2": 249.8,
"r_x3": 103.0,
"r_y3": 249.8,
"coord_origin": "TOPLEFT"
},
"text": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"orig": "\u5e74\u7dcf\u5408\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 253.2,
"r_x1": 190.9,
"r_y1": 253.2,
"r_x2": 190.9,
"r_y2": 248.8,
"r_x3": 183.1,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 253.2,
"r_x1": 212.9,
"r_y1": 253.2,
"r_x2": 212.9,
"r_y2": 248.8,
"r_x3": 210.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 253.2,
"r_x1": 240.0,
"r_y1": 253.2,
"r_x2": 240.0,
"r_y2": 248.8,
"r_x3": 232.3,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "142",
"orig": "142",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 253.2,
"r_x1": 264.6,
"r_y1": 253.2,
"r_x2": 264.6,
"r_y2": 248.8,
"r_x3": 256.9,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "223",
"orig": "223",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 253.2,
"r_x1": 289.2,
"r_y1": 253.2,
"r_x2": 289.2,
"r_y2": 248.8,
"r_x3": 281.5,
"r_y3": 248.8,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 261.5,
"r_x1": 91.8,
"r_y1": 261.5,
"r_x2": 91.8,
"r_y2": 257.3,
"r_x3": 55.5,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 88.1,
"t": 257.1,
"r": 93.2,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 88.1,
"r_y0": 261.4,
"r_x1": 93.2,
"r_y1": 261.4,
"r_x2": 93.2,
"r_y2": 257.1,
"r_x3": 88.1,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "65",
"orig": "65",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 93.2,
"t": 257.3,
"r": 119.1,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.2,
"r_y0": 261.5,
"r_x1": 119.1,
"r_y1": 261.5,
"r_x2": 119.1,
"r_y2": 257.3,
"r_x3": 93.2,
"r_y3": 257.3,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 116.5,
"t": 257.1,
"r": 129.9,
"b": 261.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 261.4,
"r_x1": 129.9,
"r_y1": 261.4,
"r_x2": 129.9,
"r_y2": 257.1,
"r_x3": 116.5,
"r_y3": 257.1,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 260.7,
"r_x1": 190.9,
"r_y1": 260.7,
"r_x2": 190.9,
"r_y2": 256.3,
"r_x3": 183.1,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "177",
"orig": "177",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 260.7,
"r_x1": 212.9,
"r_y1": 260.7,
"r_x2": 212.9,
"r_y2": 256.3,
"r_x3": 210.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 260.7,
"r_x1": 240.0,
"r_y1": 260.7,
"r_x2": 240.0,
"r_y2": 256.3,
"r_x3": 232.3,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "176",
"orig": "176",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 260.7,
"r_x1": 264.6,
"r_y1": 260.7,
"r_x2": 264.6,
"r_y2": 256.3,
"r_x3": 256.9,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 260.7,
"r_x1": 289.2,
"r_y1": 260.7,
"r_x2": 289.2,
"r_y2": 256.3,
"r_x3": 281.5,
"r_y3": 256.3,
"coord_origin": "TOPLEFT"
},
"text": "236",
"orig": "236",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 268.7,
"r_x1": 60.7,
"r_y1": 268.7,
"r_x2": 60.7,
"r_y2": 264.5,
"r_x3": 55.5,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u7b2c",
"orig": "\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 60.2,
"t": 264.3,
"r": 65.3,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.2,
"r_y0": 268.7,
"r_x1": 65.3,
"r_y1": 268.7,
"r_x2": 65.3,
"r_y2": 264.3,
"r_x3": 60.2,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 65.3,
"t": 264.5,
"r": 122.4,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 65.3,
"r_y0": 268.7,
"r_x1": 122.4,
"r_y1": 268.7,
"r_x2": 122.4,
"r_y2": 264.5,
"r_x3": 65.3,
"r_y3": 264.5,
"coord_origin": "TOPLEFT"
},
"text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 116.5,
"t": 264.3,
"r": 129.9,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.5,
"r_y0": 268.7,
"r_x1": 129.9,
"r_y1": 268.7,
"r_x2": 129.9,
"r_y2": 264.3,
"r_x3": 116.5,
"r_y3": 264.3,
"coord_origin": "TOPLEFT"
},
"text": "(2003)",
"orig": "(2003)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 267.9,
"r_x1": 190.9,
"r_y1": 267.9,
"r_x2": 190.9,
"r_y2": 263.5,
"r_x3": 183.1,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "208",
"orig": "208",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 267.9,
"r_x1": 212.9,
"r_y1": 267.9,
"r_x2": 212.9,
"r_y2": 263.5,
"r_x3": 210.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 267.9,
"r_x1": 240.0,
"r_y1": 267.9,
"r_x2": 240.0,
"r_y2": 263.5,
"r_x3": 232.3,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "203",
"orig": "203",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 267.9,
"r_x1": 264.6,
"r_y1": 267.9,
"r_x2": 264.6,
"r_y2": 263.5,
"r_x3": 256.9,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "152",
"orig": "152",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 267.9,
"r_x1": 289.2,
"r_y1": 267.9,
"r_x2": 289.2,
"r_y2": 263.5,
"r_x3": 281.5,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "244",
"orig": "244",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 275.9,
"r_x1": 107.4,
"r_y1": 275.9,
"r_x2": 107.4,
"r_y2": 271.7,
"r_x3": 55.5,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 102.0,
"t": 271.5,
"r": 109.7,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.0,
"r_y0": 275.9,
"r_x1": 109.7,
"r_y1": 275.9,
"r_x2": 109.7,
"r_y2": 271.5,
"r_x3": 102.0,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "146",
"orig": "146",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 109.7,
"t": 271.7,
"r": 114.9,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 109.7,
"r_y0": 275.9,
"r_x1": 114.9,
"r_y1": 275.9,
"r_x2": 114.9,
"r_y2": 271.7,
"r_x3": 109.7,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u301c",
"orig": "\u301c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 105,
"label": "text",
"bbox": {
"l": 114.4,
"t": 271.5,
"r": 122.1,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 114.4,
"r_y0": 275.9,
"r_x1": 122.1,
"r_y1": 275.9,
"r_x2": 122.1,
"r_y2": 271.5,
"r_x3": 114.4,
"r_y3": 271.5,
"coord_origin": "TOPLEFT"
},
"text": "155",
"orig": "155",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 106,
"label": "text",
"bbox": {
"l": 122.1,
"t": 271.7,
"r": 127.3,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.1,
"r_y0": 275.9,
"r_x1": 127.3,
"r_y1": 275.9,
"r_x2": 127.3,
"r_y2": 271.7,
"r_x3": 122.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "\u56de",
"orig": "\u56de",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 107,
"label": "text",
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 184.4,
"r_y0": 275.1,
"r_x1": 189.6,
"r_y1": 275.1,
"r_x2": 189.6,
"r_y2": 270.8,
"r_x3": 184.4,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "98",
"orig": "98",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 108,
"label": "text",
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.3,
"r_y0": 275.1,
"r_x1": 212.9,
"r_y1": 275.1,
"r_x2": 212.9,
"r_y2": 270.8,
"r_x3": 210.3,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 109,
"label": "text",
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 275.1,
"r_x1": 238.8,
"r_y1": 275.1,
"r_x2": 238.8,
"r_y2": 270.8,
"r_x3": 233.6,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 110,
"label": "text",
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 275.1,
"r_x1": 264.6,
"r_y1": 275.1,
"r_x2": 264.6,
"r_y2": 270.8,
"r_x3": 256.9,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "150",
"orig": "150",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 111,
"label": "text",
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 275.1,
"r_x1": 289.2,
"r_y1": 275.1,
"r_x2": 289.2,
"r_y2": 270.8,
"r_x3": 281.5,
"r_y3": 270.8,
"coord_origin": "TOPLEFT"
},
"text": "232",
"orig": "232",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 112,
"label": "text",
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 55.5,
"r_y0": 283.4,
"r_x1": 68.7,
"r_y1": 283.4,
"r_x2": 68.7,
"r_y2": 279.0,
"r_x3": 55.5,
"r_y3": 279.0,
"coord_origin": "TOPLEFT"
},
"text": "WWW",
"orig": "WWW",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 113,
"label": "text",
"bbox": {
"l": 68.7,
"t": 279.2,
"r": 110.2,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 283.4,
"r_x1": 110.2,
"r_y1": 283.4,
"r_x2": 110.2,
"r_y2": 279.2,
"r_x3": 68.7,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 114,
"label": "text",
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 282.3,
"r_x1": 190.9,
"r_y1": 282.3,
"r_x2": 190.9,
"r_y2": 278.0,
"r_x3": 183.1,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "107",
"orig": "107",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 115,
"label": "text",
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 282.3,
"r_x1": 214.2,
"r_y1": 282.3,
"r_x2": 214.2,
"r_y2": 278.0,
"r_x3": 209.0,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "73",
"orig": "73",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 116,
"label": "text",
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 233.6,
"r_y0": 282.3,
"r_x1": 238.8,
"r_y1": 282.3,
"r_x2": 238.8,
"r_y2": 278.0,
"r_x3": 233.6,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 117,
"label": "text",
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 256.9,
"r_y0": 282.3,
"r_x1": 264.6,
"r_y1": 282.3,
"r_x2": 264.6,
"r_y2": 278.0,
"r_x3": 256.9,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "147",
"orig": "147",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 118,
"label": "text",
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 282.8,
"r_y0": 282.3,
"r_x1": 287.9,
"r_y1": 282.3,
"r_x2": 287.9,
"r_y2": 278.0,
"r_x3": 282.8,
"r_y3": 278.0,
"coord_origin": "TOPLEFT"
},
"text": "96",
"orig": "96",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 119,
"label": "text",
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 169.6,
"r_y0": 290.6,
"r_x1": 174.8,
"r_y1": 290.6,
"r_x2": 174.8,
"r_y2": 286.5,
"r_x3": 169.6,
"r_y3": 286.5,
"coord_origin": "TOPLEFT"
},
"text": "\u8a08",
"orig": "\u8a08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 120,
"label": "text",
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 183.1,
"r_y0": 289.8,
"r_x1": 190.9,
"r_y1": 289.8,
"r_x2": 190.9,
"r_y2": 285.5,
"r_x3": 183.1,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "945",
"orig": "945",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 121,
"label": "text",
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.7,
"r_y0": 289.8,
"r_x1": 215.4,
"r_y1": 289.8,
"r_x2": 215.4,
"r_y2": 285.5,
"r_x3": 207.7,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "294",
"orig": "294",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 122,
"label": "text",
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.3,
"r_y0": 289.8,
"r_x1": 240.0,
"r_y1": 289.8,
"r_x2": 240.0,
"r_y2": 285.5,
"r_x3": 232.3,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "651",
"orig": "651",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 123,
"label": "text",
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 255.8,
"r_y0": 289.8,
"r_x1": 265.8,
"r_y1": 289.8,
"r_x2": 265.8,
"r_y2": 285.5,
"r_x3": 255.8,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "1122",
"orig": "1122",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 124,
"label": "text",
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 281.5,
"r_y0": 289.8,
"r_x1": 289.2,
"r_y1": 289.8,
"r_x2": 289.2,
"r_y2": 285.5,
"r_x3": 281.5,
"r_y3": 285.5,
"coord_origin": "TOPLEFT"
},
"text": "955",
"orig": "955",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 10,
"num_cols": 6,
"table_cells": [
{
"bbox": {
"l": 209.9,
"t": 222.2,
"r": 241.0,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 2,
"end_col_offset_idx": 4,
"text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 263.8,
"t": 222.2,
"r": 284.5,
"b": 226.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 4,
"end_col_offset_idx": 6,
"text": "\u53c2\u8003\u6587\u732e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 110.2,
"t": 229.7,
"r": 120.6,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u51fa\u5178",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 175.4,
"t": 229.7,
"r": 196.1,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "\u30d5\u30a1\u30a4\u30eb \u6570",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.6,
"t": 229.7,
"r": 220.0,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 229.2,
"t": 229.7,
"r": 244.8,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.1,
"t": 229.7,
"r": 266.5,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "\u82f1\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 278.4,
"t": 229.7,
"r": 293.9,
"b": 233.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "\u65e5\u672c\u8a9e",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 236.4,
"r": 162.7,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Association for Computational Linguistics(ACL2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 236.4,
"r": 189.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 236.4,
"r": 214.2,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "65",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 236.4,
"r": 237.5,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 236.4,
"r": 264.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 236.4,
"r": 286.6,
"b": 240.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 242.6,
"r": 139.7,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Computational Linguistics(COLING2002)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 242.6,
"r": 190.9,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 242.6,
"r": 215.4,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "140",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 234.9,
"t": 242.6,
"r": 237.5,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 242.6,
"r": 264.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 284.1,
"t": 242.6,
"r": 286.6,
"b": 247.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 249.8,
"r": 97.0,
"b": 254.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 248.8,
"r": 190.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 248.8,
"r": 212.9,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "8",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 248.8,
"r": 240.0,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "142",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 248.8,
"r": 264.6,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "223",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 248.8,
"r": 289.2,
"b": 253.2,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 257.3,
"r": 91.8,
"b": 261.5,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 256.3,
"r": 190.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "177",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 256.3,
"r": 212.9,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 256.3,
"r": 240.0,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "176",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 256.3,
"r": 264.6,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 256.3,
"r": 289.2,
"b": 260.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "236",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 264.5,
"r": 60.7,
"b": 268.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 263.5,
"r": 190.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "208",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 263.5,
"r": 212.9,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 263.5,
"r": 240.0,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "203",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 263.5,
"r": 264.6,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "152",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 263.5,
"r": 289.2,
"b": 267.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "244",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 271.7,
"r": 107.4,
"b": 275.9,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 184.4,
"t": 270.8,
"r": 189.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "98",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 210.3,
"t": 270.8,
"r": 212.9,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 270.8,
"r": 238.8,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 270.8,
"r": 264.6,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "150",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 270.8,
"r": 289.2,
"b": 275.1,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 7,
"end_row_offset_idx": 8,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "232",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 55.5,
"t": 279.0,
"r": 68.7,
"b": 283.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 278.0,
"r": 190.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "107",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.0,
"t": 278.0,
"r": 214.2,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "73",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 233.6,
"t": 278.0,
"r": 238.8,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "34",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 256.9,
"t": 278.0,
"r": 264.6,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "147",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 282.8,
"t": 278.0,
"r": 287.9,
"b": 282.3,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 8,
"end_row_offset_idx": 9,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "96",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 169.6,
"t": 286.5,
"r": 174.8,
"b": 290.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "\u8a08",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 183.1,
"t": 285.5,
"r": 190.9,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.7,
"t": 285.5,
"r": 215.4,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "294",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 232.3,
"t": 285.5,
"r": 240.0,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "651",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 255.8,
"t": 285.5,
"r": 265.8,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "1122",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 281.5,
"t": 285.5,
"r": 289.2,
"b": 289.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 9,
"end_row_offset_idx": 10,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "955",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 16,
"page_no": 7,
"cluster": {
"id": 16,
"label": "caption",
"bbox": {
"l": 380.4,
"t": 292.3,
"r": 549.4,
"b": 298.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 380.4,
"r_y0": 298.6,
"r_x1": 549.4,
"r_y1": 298.6,
"r_x2": 549.4,
"r_y2": 292.3,
"r_x3": 380.4,
"r_y3": 292.3,
"coord_origin": "TOPLEFT"
},
"text": "Text is aligned to match original for ease of viewing",
"orig": "Text is aligned to match original for ease of viewing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Text is aligned to match original for ease of viewing"
},
{
"label": "table",
"id": 7,
"page_no": 7,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 304.9,
"t": 218.5,
"r": 550.2,
"b": 287.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 125,
"label": "text",
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 226.7,
"r_x1": 542.0,
"r_y1": 226.7,
"r_x2": 542.0,
"r_y2": 221.6,
"r_x3": 459.0,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Weighted Average Grant Date Fair",
"orig": "Weighted Average Grant Date Fair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 126,
"label": "text",
"bbox": {
"l": 493.8,
"t": 227.8,
"r": 507.2,
"b": 232.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 493.8,
"r_y0": 232.9,
"r_x1": 507.2,
"r_y1": 232.9,
"r_x2": 507.2,
"r_y2": 227.8,
"r_x3": 493.8,
"r_y3": 227.8,
"coord_origin": "TOPLEFT"
},
"text": "Value",
"orig": "Value",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 127,
"label": "text",
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 393.2,
"r_y0": 241.8,
"r_x1": 400.7,
"r_y1": 241.8,
"r_x2": 400.7,
"r_y2": 236.7,
"r_x3": 393.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RS",
"orig": "RS",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 128,
"label": "text",
"bbox": {
"l": 400.7,
"t": 236.7,
"r": 404.6,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 241.8,
"r_x1": 404.6,
"r_y1": 241.8,
"r_x2": 404.6,
"r_y2": 236.7,
"r_x3": 400.7,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "U",
"orig": "U",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 129,
"label": "text",
"bbox": {
"l": 404.6,
"t": 236.7,
"r": 407.3,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 404.6,
"r_y0": 241.8,
"r_x1": 407.3,
"r_y1": 241.8,
"r_x2": 407.3,
"r_y2": 236.7,
"r_x3": 404.6,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "s",
"orig": "s",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 130,
"label": "text",
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 392.1,
"r_y0": 226.6,
"r_x1": 438.0,
"r_y1": 226.6,
"r_x2": 438.0,
"r_y2": 221.6,
"r_x3": 392.1,
"r_y3": 221.6,
"coord_origin": "TOPLEFT"
},
"text": "Shares (in millions)",
"orig": "Shares (in millions)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 131,
"label": "text",
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.2,
"r_y0": 241.8,
"r_x1": 441.0,
"r_y1": 241.8,
"r_x2": 441.0,
"r_y2": 236.7,
"r_x3": 427.2,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 132,
"label": "text",
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.4,
"r_y0": 241.8,
"r_x1": 482.5,
"r_y1": 241.8,
"r_x2": 482.5,
"r_y2": 236.7,
"r_x3": 468.4,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "RSUs",
"orig": "RSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 133,
"label": "text",
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.9,
"r_y0": 241.8,
"r_x1": 530.7,
"r_y1": 241.8,
"r_x2": 530.7,
"r_y2": 236.7,
"r_x3": 516.9,
"r_y3": 236.7,
"coord_origin": "TOPLEFT"
},
"text": "PSUs",
"orig": "PSUs",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 134,
"label": "text",
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 249.7,
"r_x1": 355.7,
"r_y1": 249.7,
"r_x2": 355.7,
"r_y2": 244.6,
"r_x3": 306.1,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on Janua",
"orig": "Nonvested on Janua",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 135,
"label": "text",
"bbox": {
"l": 355.7,
"t": 244.6,
"r": 364.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 355.7,
"r_y0": 249.7,
"r_x1": 364.7,
"r_y1": 249.7,
"r_x2": 364.7,
"r_y2": 244.6,
"r_x3": 355.7,
"r_y3": 244.6,
"coord_origin": "TOPLEFT"
},
"text": "ry 1",
"orig": "ry 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 136,
"label": "text",
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 250.0,
"r_x1": 400.8,
"r_y1": 250.0,
"r_x2": 400.8,
"r_y2": 244.9,
"r_x3": 396.2,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 137,
"label": "text",
"bbox": {
"l": 400.8,
"t": 244.9,
"r": 403.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 250.0,
"r_x1": 403.8,
"r_y1": 250.0,
"r_x2": 403.8,
"r_y2": 244.9,
"r_x3": 400.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 138,
"label": "text",
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 250.0,
"r_x1": 437.3,
"r_y1": 250.0,
"r_x2": 437.3,
"r_y2": 244.9,
"r_x3": 429.8,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 139,
"label": "text",
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.5,
"r_y0": 250.0,
"r_x1": 478.4,
"r_y1": 250.0,
"r_x2": 478.4,
"r_y2": 244.9,
"r_x3": 465.5,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "90.10",
"orig": "90.10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 140,
"label": "text",
"bbox": {
"l": 481.0,
"t": 244.9,
"r": 483.6,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 481.0,
"r_y0": 250.0,
"r_x1": 483.6,
"r_y1": 250.0,
"r_x2": 483.6,
"r_y2": 244.9,
"r_x3": 481.0,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$",
"orig": "$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 141,
"label": "text",
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.4,
"r_y0": 250.0,
"r_x1": 531.5,
"r_y1": 250.0,
"r_x2": 531.5,
"r_y2": 244.9,
"r_x3": 513.4,
"r_y3": 244.9,
"coord_origin": "TOPLEFT"
},
"text": "$ 91.19",
"orig": "$ 91.19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 142,
"label": "text",
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 258.7,
"r_x1": 325.6,
"r_y1": 258.7,
"r_x2": 325.6,
"r_y2": 253.7,
"r_x3": 306.1,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "Granted",
"orig": "Granted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 143,
"label": "text",
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 258.7,
"r_x1": 400.8,
"r_y1": 258.7,
"r_x2": 400.8,
"r_y2": 253.7,
"r_x3": 396.2,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.",
"orig": "0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 144,
"label": "text",
"bbox": {
"l": 400.8,
"t": 253.7,
"r": 403.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.8,
"r_y0": 258.7,
"r_x1": 403.8,
"r_y1": 258.7,
"r_x2": 403.8,
"r_y2": 253.7,
"r_x3": 400.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 145,
"label": "text",
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.8,
"r_y0": 258.7,
"r_x1": 437.3,
"r_y1": 258.7,
"r_x2": 437.3,
"r_y2": 253.7,
"r_x3": 429.8,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "0.1",
"orig": "0.1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 146,
"label": "text",
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.4,
"r_y0": 258.7,
"r_x1": 482.5,
"r_y1": 258.7,
"r_x2": 482.5,
"r_y2": 253.7,
"r_x3": 466.4,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "117.44",
"orig": "117.44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 147,
"label": "text",
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 514.3,
"r_y0": 258.7,
"r_x1": 530.8,
"r_y1": 258.7,
"r_x2": 530.8,
"r_y2": 253.7,
"r_x3": 514.3,
"r_y3": 253.7,
"coord_origin": "TOPLEFT"
},
"text": "122.41",
"orig": "122.41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 148,
"label": "text",
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 266.6,
"r_x1": 322.6,
"r_y1": 266.6,
"r_x2": 322.6,
"r_y2": 261.5,
"r_x3": 306.1,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "Vested",
"orig": "Vested",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 149,
"label": "text",
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 266.6,
"r_x1": 400.7,
"r_y1": 266.6,
"r_x2": 400.7,
"r_y2": 261.5,
"r_x3": 394.4,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 150,
"label": "text",
"bbox": {
"l": 400.7,
"t": 261.5,
"r": 403.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 266.6,
"r_x1": 403.7,
"r_y1": 266.6,
"r_x2": 403.7,
"r_y2": 261.5,
"r_x3": 400.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 151,
"label": "text",
"bbox": {
"l": 403.7,
"t": 261.5,
"r": 405.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 266.6,
"r_x1": 405.5,
"r_y1": 266.6,
"r_x2": 405.5,
"r_y2": 261.5,
"r_x3": 403.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 152,
"label": "text",
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 427.7,
"r_y0": 266.6,
"r_x1": 438.8,
"r_y1": 266.6,
"r_x2": 438.8,
"r_y2": 261.5,
"r_x3": 427.7,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "(0.1)",
"orig": "(0.1)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 153,
"label": "text",
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 468.6,
"r_y0": 266.6,
"r_x1": 482.1,
"r_y1": 266.6,
"r_x2": 482.1,
"r_y2": 261.5,
"r_x3": 468.6,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "87.08",
"orig": "87.08",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 154,
"label": "text",
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 266.6,
"r_x1": 529.5,
"r_y1": 266.6,
"r_x2": 529.5,
"r_y2": 261.5,
"r_x3": 516.0,
"r_y3": 261.5,
"coord_origin": "TOPLEFT"
},
"text": "81.14",
"orig": "81.14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 155,
"label": "text",
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 274.7,
"r_x1": 356.2,
"r_y1": 274.7,
"r_x2": 356.2,
"r_y2": 269.6,
"r_x3": 306.1,
"r_y3": 269.6,
"coord_origin": "TOPLEFT"
},
"text": "Canceled or forfeited",
"orig": "Canceled or forfeited",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 156,
"label": "text",
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 394.4,
"r_y0": 275.4,
"r_x1": 400.7,
"r_y1": 275.4,
"r_x2": 400.7,
"r_y2": 270.3,
"r_x3": 394.4,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "(0.",
"orig": "(0.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 157,
"label": "text",
"bbox": {
"l": 400.7,
"t": 270.3,
"r": 403.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.7,
"r_y0": 275.4,
"r_x1": 403.7,
"r_y1": 275.4,
"r_x2": 403.7,
"r_y2": 270.3,
"r_x3": 400.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 158,
"label": "text",
"bbox": {
"l": 403.7,
"t": 270.3,
"r": 405.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 275.4,
"r_x1": 405.5,
"r_y1": 275.4,
"r_x2": 405.5,
"r_y2": 270.3,
"r_x3": 403.7,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": ")",
"orig": ")",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 159,
"label": "text",
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.0,
"r_y0": 275.4,
"r_x1": 436.4,
"r_y1": 275.4,
"r_x2": 436.4,
"r_y2": 270.3,
"r_x3": 431.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "-",
"orig": "-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 160,
"label": "text",
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 465.8,
"r_y0": 275.4,
"r_x1": 482.4,
"r_y1": 275.4,
"r_x2": 482.4,
"r_y2": 270.3,
"r_x3": 465.8,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "102.01",
"orig": "102.01",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 161,
"label": "text",
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 516.0,
"r_y0": 275.4,
"r_x1": 529.5,
"r_y1": 275.4,
"r_x2": 529.5,
"r_y2": 270.3,
"r_x3": 516.0,
"r_y3": 270.3,
"coord_origin": "TOPLEFT"
},
"text": "92.18",
"orig": "92.18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 162,
"label": "text",
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 306.1,
"r_y0": 283.6,
"r_x1": 373.4,
"r_y1": 283.6,
"r_x2": 373.4,
"r_y2": 278.5,
"r_x3": 306.1,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "Nonvested on December 31",
"orig": "Nonvested on December 31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 163,
"label": "text",
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 283.6,
"r_x1": 403.8,
"r_y1": 283.6,
"r_x2": 403.8,
"r_y2": 278.5,
"r_x3": 396.2,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "1.0",
"orig": "1.0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 164,
"label": "text",
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 429.5,
"r_y0": 283.6,
"r_x1": 437.0,
"r_y1": 283.6,
"r_x2": 437.0,
"r_y2": 278.5,
"r_x3": 429.5,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "0.3",
"orig": "0.3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 165,
"label": "text",
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.7,
"r_y0": 283.6,
"r_x1": 484.7,
"r_y1": 283.6,
"r_x2": 484.7,
"r_y2": 278.5,
"r_x3": 463.7,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "104.85 $",
"orig": "104.85 $",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 166,
"label": "text",
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 513.0,
"r_y0": 283.6,
"r_x1": 534.0,
"r_y1": 283.6,
"r_x2": 534.0,
"r_y2": 278.5,
"r_x3": 513.0,
"r_y3": 278.5,
"coord_origin": "TOPLEFT"
},
"text": "$ 104.51",
"orig": "$ 104.51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"lcel",
"ched",
"lcel",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 7,
"num_cols": 5,
"table_cells": [
{
"bbox": {
"l": 459.0,
"t": 221.6,
"r": 542.0,
"b": 226.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 5,
"text": "Weighted Average Grant Date Fair Value",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 393.2,
"t": 236.7,
"r": 400.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "RS U s",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 392.1,
"t": 221.6,
"r": 438.0,
"b": 226.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 2,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 1,
"end_col_offset_idx": 3,
"text": "Shares (in millions)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.2,
"t": 236.7,
"r": 441.0,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.4,
"t": 236.7,
"r": 482.5,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "RSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.9,
"t": 236.7,
"r": 530.7,
"b": 241.8,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "PSUs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 244.6,
"r": 355.7,
"b": 249.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on Janua ry 1",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 244.9,
"r": 400.8,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1. 1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 244.9,
"r": 437.3,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.5,
"t": 244.9,
"r": 478.4,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "90.10 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.4,
"t": 244.9,
"r": 531.5,
"b": 250.0,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 91.19",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 253.7,
"r": 325.6,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Granted",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 253.7,
"r": 400.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "0. 5",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.8,
"t": 253.7,
"r": 437.3,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.1",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 466.4,
"t": 253.7,
"r": 482.5,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "117.44",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 514.3,
"t": 253.7,
"r": 530.8,
"b": 258.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "122.41",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 261.5,
"r": 322.6,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Vested",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 261.5,
"r": 400.7,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 5 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.7,
"t": 261.5,
"r": 438.8,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "(0.1)",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 468.6,
"t": 261.5,
"r": 482.1,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "87.08",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 261.5,
"r": 529.5,
"b": 266.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "81.14",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 269.6,
"r": 356.2,
"b": 274.7,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Canceled or forfeited",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 394.4,
"t": 270.3,
"r": 400.7,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "(0. 1 )",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 431.0,
"t": 270.3,
"r": 436.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "-",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 465.8,
"t": 270.3,
"r": 482.4,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "102.01",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 516.0,
"t": 270.3,
"r": 529.5,
"b": 275.4,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "92.18",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 306.1,
"t": 278.5,
"r": 373.4,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "Nonvested on December 31",
"column_header": false,
"row_header": true,
"row_section": false
},
{
"bbox": {
"l": 396.2,
"t": 278.5,
"r": 403.8,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "1.0",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 429.5,
"t": 278.5,
"r": 437.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "0.3",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 463.7,
"t": 278.5,
"r": 484.7,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "104.85 $",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 513.0,
"t": 278.5,
"r": 534.0,
"b": 283.6,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 6,
"end_row_offset_idx": 7,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "$ 104.51",
"column_header": false,
"row_header": false,
"row_section": false
}
]
},
{
"label": "caption",
"id": 6,
"page_no": 7,
"cluster": {
"id": 6,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 320.9,
"r": 545.1,
"b": 365.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 329.8,
"r_x1": 86.9,
"r_y1": 329.8,
"r_x2": 86.9,
"r_y2": 320.9,
"r_x3": 50.1,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 5:",
"orig": "Figure 5:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 93.9,
"r_y0": 329.8,
"r_x1": 545.1,
"r_y1": 329.8,
"r_x2": 545.1,
"r_y2": 320.9,
"r_x3": 93.9,
"r_y3": 320.9,
"coord_origin": "TOPLEFT"
},
"text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 341.7,
"r_x1": 545.1,
"r_y1": 341.7,
"r_x2": 545.1,
"r_y2": 332.8,
"r_x3": 50.1,
"r_y3": 332.8,
"coord_origin": "TOPLEFT"
},
"text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 353.7,
"r_x1": 545.1,
"r_y1": 353.7,
"r_x2": 545.1,
"r_y2": 344.8,
"r_x3": 50.1,
"r_y3": 344.8,
"coord_origin": "TOPLEFT"
},
"text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.6,
"r_x1": 139.8,
"r_y1": 365.6,
"r_x2": 139.8,
"r_y2": 356.7,
"r_x3": 50.1,
"r_y3": 356.7,
"coord_origin": "TOPLEFT"
},
"text": "the FinTabNet dataset.",
"orig": "the FinTabNet dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."
},
{
"label": "picture",
"id": 12,
"page_no": 7,
"cluster": {
"id": 12,
"label": "picture",
"bbox": {
"l": 216.8,
"t": 380.5,
"r": 375.8,
"b": 443.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 167,
"label": "text",
"bbox": {
"l": 220.3,
"t": 381.8,
"r": 342.1,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.3,
"r_y0": 386.4,
"r_x1": 342.1,
"r_y1": 386.4,
"r_x2": 342.1,
"r_y2": 381.8,
"r_x3": 220.3,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Red - PDF cells, Green - predicted bounding boxes",
"orig": "Red - PDF cells, Green - predicted bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 11,
"page_no": 7,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 51.7,
"t": 380.5,
"r": 211.8,
"b": 443.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 168,
"label": "text",
"bbox": {
"l": 53.7,
"t": 381.8,
"r": 85.7,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.7,
"r_y0": 386.4,
"r_x1": 85.7,
"r_y1": 386.4,
"r_x2": 85.7,
"r_y2": 381.8,
"r_x3": 53.7,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Ground Truth",
"orig": "Ground Truth",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 13,
"page_no": 7,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 383.1,
"t": 381.2,
"r": 542.1,
"b": 442.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 169,
"label": "text",
"bbox": {
"l": 437.4,
"t": 400.6,
"r": 443.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 406.9,
"r_x1": 443.7,
"r_y1": 406.9,
"r_x2": 443.7,
"r_y2": 400.6,
"r_x3": 437.4,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 170,
"label": "text",
"bbox": {
"l": 450.3,
"t": 400.6,
"r": 456.7,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 406.9,
"r_x1": 456.7,
"r_y1": 406.9,
"r_x2": 456.7,
"r_y2": 400.6,
"r_x3": 450.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "17",
"orig": "17",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 171,
"label": "text",
"bbox": {
"l": 463.3,
"t": 400.6,
"r": 469.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 406.9,
"r_x1": 469.6,
"r_y1": 406.9,
"r_x2": 469.6,
"r_y2": 400.6,
"r_x3": 463.3,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "18",
"orig": "18",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 172,
"label": "text",
"bbox": {
"l": 476.2,
"t": 400.6,
"r": 482.6,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 406.9,
"r_x1": 482.6,
"r_y1": 406.9,
"r_x2": 482.6,
"r_y2": 400.6,
"r_x3": 476.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "19",
"orig": "19",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 173,
"label": "text",
"bbox": {
"l": 489.2,
"t": 400.6,
"r": 495.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 406.9,
"r_x1": 495.5,
"r_y1": 406.9,
"r_x2": 495.5,
"r_y2": 400.6,
"r_x3": 489.2,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "20",
"orig": "20",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 174,
"label": "text",
"bbox": {
"l": 502.1,
"t": 400.6,
"r": 508.5,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 406.9,
"r_x1": 508.5,
"r_y1": 406.9,
"r_x2": 508.5,
"r_y2": 400.6,
"r_x3": 502.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "21",
"orig": "21",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 175,
"label": "text",
"bbox": {
"l": 515.1,
"t": 400.6,
"r": 521.4,
"b": 406.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 406.9,
"r_x1": 521.4,
"r_y1": 406.9,
"r_x2": 521.4,
"r_y2": 400.6,
"r_x3": 515.1,
"r_y3": 400.6,
"coord_origin": "TOPLEFT"
},
"text": "22",
"orig": "22",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 176,
"label": "text",
"bbox": {
"l": 385.3,
"t": 411.0,
"r": 391.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 417.4,
"r_x1": 391.6,
"r_y1": 417.4,
"r_x2": 391.6,
"r_y2": 411.0,
"r_x3": 385.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "23",
"orig": "23",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 177,
"label": "text",
"bbox": {
"l": 398.5,
"t": 411.0,
"r": 404.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 417.4,
"r_x1": 404.8,
"r_y1": 417.4,
"r_x2": 404.8,
"r_y2": 411.0,
"r_x3": 398.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "24",
"orig": "24",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 178,
"label": "text",
"bbox": {
"l": 411.5,
"t": 411.0,
"r": 417.8,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 417.4,
"r_x1": 417.8,
"r_y1": 417.4,
"r_x2": 417.8,
"r_y2": 411.0,
"r_x3": 411.5,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "25",
"orig": "25",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 179,
"label": "text",
"bbox": {
"l": 437.4,
"t": 411.0,
"r": 443.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 417.4,
"r_x1": 443.7,
"r_y1": 417.4,
"r_x2": 443.7,
"r_y2": 411.0,
"r_x3": 437.4,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "26",
"orig": "26",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 180,
"label": "text",
"bbox": {
"l": 450.3,
"t": 411.0,
"r": 456.7,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 417.4,
"r_x1": 456.7,
"r_y1": 417.4,
"r_x2": 456.7,
"r_y2": 411.0,
"r_x3": 450.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "27",
"orig": "27",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 181,
"label": "text",
"bbox": {
"l": 463.3,
"t": 411.0,
"r": 469.6,
"b": 417.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 417.4,
"r_x1": 469.6,
"r_y1": 417.4,
"r_x2": 469.6,
"r_y2": 411.0,
"r_x3": 463.3,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "28",
"orig": "28",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 182,
"label": "text",
"bbox": {
"l": 385.3,
"t": 421.1,
"r": 391.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 427.4,
"r_x1": 391.6,
"r_y1": 427.4,
"r_x2": 391.6,
"r_y2": 421.1,
"r_x3": 385.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "30",
"orig": "30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 183,
"label": "text",
"bbox": {
"l": 398.5,
"t": 421.1,
"r": 404.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 427.4,
"r_x1": 404.8,
"r_y1": 427.4,
"r_x2": 404.8,
"r_y2": 421.1,
"r_x3": 398.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "31",
"orig": "31",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 184,
"label": "text",
"bbox": {
"l": 411.5,
"t": 421.1,
"r": 417.8,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 427.4,
"r_x1": 417.8,
"r_y1": 427.4,
"r_x2": 417.8,
"r_y2": 421.1,
"r_x3": 411.5,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "32",
"orig": "32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 185,
"label": "text",
"bbox": {
"l": 424.4,
"t": 421.1,
"r": 430.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 427.4,
"r_x1": 430.7,
"r_y1": 427.4,
"r_x2": 430.7,
"r_y2": 421.1,
"r_x3": 424.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "33",
"orig": "33",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 186,
"label": "text",
"bbox": {
"l": 437.4,
"t": 421.1,
"r": 443.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 427.4,
"r_x1": 443.7,
"r_y1": 427.4,
"r_x2": 443.7,
"r_y2": 421.1,
"r_x3": 437.4,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "34",
"orig": "34",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 187,
"label": "text",
"bbox": {
"l": 450.3,
"t": 421.1,
"r": 456.7,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 427.4,
"r_x1": 456.7,
"r_y1": 427.4,
"r_x2": 456.7,
"r_y2": 421.1,
"r_x3": 450.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "35",
"orig": "35",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 188,
"label": "text",
"bbox": {
"l": 463.3,
"t": 421.1,
"r": 469.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 427.4,
"r_x1": 469.6,
"r_y1": 427.4,
"r_x2": 469.6,
"r_y2": 421.1,
"r_x3": 463.3,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "36",
"orig": "36",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 189,
"label": "text",
"bbox": {
"l": 476.2,
"t": 421.1,
"r": 482.6,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 427.4,
"r_x1": 482.6,
"r_y1": 427.4,
"r_x2": 482.6,
"r_y2": 421.1,
"r_x3": 476.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "37",
"orig": "37",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 190,
"label": "text",
"bbox": {
"l": 489.2,
"t": 421.1,
"r": 495.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 427.4,
"r_x1": 495.5,
"r_y1": 427.4,
"r_x2": 495.5,
"r_y2": 421.1,
"r_x3": 489.2,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "38",
"orig": "38",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 191,
"label": "text",
"bbox": {
"l": 502.1,
"t": 421.1,
"r": 508.5,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 427.4,
"r_x1": 508.5,
"r_y1": 427.4,
"r_x2": 508.5,
"r_y2": 421.1,
"r_x3": 502.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "39",
"orig": "39",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 192,
"label": "text",
"bbox": {
"l": 515.1,
"t": 421.1,
"r": 521.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 427.4,
"r_x1": 521.4,
"r_y1": 427.4,
"r_x2": 521.4,
"r_y2": 421.1,
"r_x3": 515.1,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "40",
"orig": "40",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 193,
"label": "text",
"bbox": {
"l": 528.0,
"t": 421.1,
"r": 534.4,
"b": 427.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 427.4,
"r_x1": 534.4,
"r_y1": 427.4,
"r_x2": 534.4,
"r_y2": 421.1,
"r_x3": 528.0,
"r_y3": 421.1,
"coord_origin": "TOPLEFT"
},
"text": "41",
"orig": "41",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 194,
"label": "text",
"bbox": {
"l": 385.3,
"t": 432.0,
"r": 391.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 438.4,
"r_x1": 391.6,
"r_y1": 438.4,
"r_x2": 391.6,
"r_y2": 432.0,
"r_x3": 385.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "42",
"orig": "42",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 195,
"label": "text",
"bbox": {
"l": 398.5,
"t": 432.0,
"r": 404.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 438.4,
"r_x1": 404.8,
"r_y1": 438.4,
"r_x2": 404.8,
"r_y2": 432.0,
"r_x3": 398.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "43",
"orig": "43",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 196,
"label": "text",
"bbox": {
"l": 411.5,
"t": 432.0,
"r": 417.8,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 438.4,
"r_x1": 417.8,
"r_y1": 438.4,
"r_x2": 417.8,
"r_y2": 432.0,
"r_x3": 411.5,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "44",
"orig": "44",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 197,
"label": "text",
"bbox": {
"l": 424.4,
"t": 432.0,
"r": 430.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 438.4,
"r_x1": 430.7,
"r_y1": 438.4,
"r_x2": 430.7,
"r_y2": 432.0,
"r_x3": 424.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "45",
"orig": "45",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 198,
"label": "text",
"bbox": {
"l": 437.4,
"t": 432.0,
"r": 443.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 438.4,
"r_x1": 443.7,
"r_y1": 438.4,
"r_x2": 443.7,
"r_y2": 432.0,
"r_x3": 437.4,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "46",
"orig": "46",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 199,
"label": "text",
"bbox": {
"l": 450.3,
"t": 432.0,
"r": 456.7,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 438.4,
"r_x1": 456.7,
"r_y1": 438.4,
"r_x2": 456.7,
"r_y2": 432.0,
"r_x3": 450.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "47",
"orig": "47",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 200,
"label": "text",
"bbox": {
"l": 463.3,
"t": 432.0,
"r": 469.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 438.4,
"r_x1": 469.6,
"r_y1": 438.4,
"r_x2": 469.6,
"r_y2": 432.0,
"r_x3": 463.3,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "48",
"orig": "48",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 201,
"label": "text",
"bbox": {
"l": 476.2,
"t": 432.0,
"r": 482.6,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 438.4,
"r_x1": 482.6,
"r_y1": 438.4,
"r_x2": 482.6,
"r_y2": 432.0,
"r_x3": 476.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "49",
"orig": "49",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 202,
"label": "text",
"bbox": {
"l": 489.2,
"t": 432.0,
"r": 495.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 438.4,
"r_x1": 495.5,
"r_y1": 438.4,
"r_x2": 495.5,
"r_y2": 432.0,
"r_x3": 489.2,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "50",
"orig": "50",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 203,
"label": "text",
"bbox": {
"l": 502.1,
"t": 432.0,
"r": 508.5,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 438.4,
"r_x1": 508.5,
"r_y1": 438.4,
"r_x2": 508.5,
"r_y2": 432.0,
"r_x3": 502.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "51",
"orig": "51",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 204,
"label": "text",
"bbox": {
"l": 515.1,
"t": 432.0,
"r": 521.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 438.4,
"r_x1": 521.4,
"r_y1": 438.4,
"r_x2": 521.4,
"r_y2": 432.0,
"r_x3": 515.1,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "52",
"orig": "52",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 205,
"label": "text",
"bbox": {
"l": 528.0,
"t": 432.0,
"r": 534.4,
"b": 438.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 438.4,
"r_x1": 534.4,
"r_y1": 438.4,
"r_x2": 534.4,
"r_y2": 432.0,
"r_x3": 528.0,
"r_y3": 432.0,
"coord_origin": "TOPLEFT"
},
"text": "53",
"orig": "53",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 206,
"label": "text",
"bbox": {
"l": 385.3,
"t": 389.2,
"r": 388.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 395.5,
"r_x1": 388.4,
"r_y1": 395.5,
"r_x2": 388.4,
"r_y2": 389.2,
"r_x3": 385.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "0",
"orig": "0",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 207,
"label": "text",
"bbox": {
"l": 398.5,
"t": 389.2,
"r": 401.7,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 395.5,
"r_x1": 401.7,
"r_y1": 395.5,
"r_x2": 401.7,
"r_y2": 389.2,
"r_x3": 398.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "1",
"orig": "1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 208,
"label": "text",
"bbox": {
"l": 411.5,
"t": 389.2,
"r": 414.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 395.5,
"r_x1": 414.6,
"r_y1": 395.5,
"r_x2": 414.6,
"r_y2": 389.2,
"r_x3": 411.5,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 209,
"label": "text",
"bbox": {
"l": 424.4,
"t": 389.2,
"r": 427.6,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 395.5,
"r_x1": 427.6,
"r_y1": 395.5,
"r_x2": 427.6,
"r_y2": 389.2,
"r_x3": 424.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 210,
"label": "text",
"bbox": {
"l": 437.4,
"t": 389.2,
"r": 440.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.4,
"r_y0": 395.5,
"r_x1": 440.5,
"r_y1": 395.5,
"r_x2": 440.5,
"r_y2": 389.2,
"r_x3": 437.4,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "4",
"orig": "4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 211,
"label": "text",
"bbox": {
"l": 450.3,
"t": 389.2,
"r": 453.5,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 450.3,
"r_y0": 395.5,
"r_x1": 453.5,
"r_y1": 395.5,
"r_x2": 453.5,
"r_y2": 389.2,
"r_x3": 450.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "5",
"orig": "5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 212,
"label": "text",
"bbox": {
"l": 463.3,
"t": 389.2,
"r": 466.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 463.3,
"r_y0": 395.5,
"r_x1": 466.4,
"r_y1": 395.5,
"r_x2": 466.4,
"r_y2": 389.2,
"r_x3": 463.3,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "6",
"orig": "6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 213,
"label": "text",
"bbox": {
"l": 476.2,
"t": 389.2,
"r": 479.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 476.2,
"r_y0": 395.5,
"r_x1": 479.4,
"r_y1": 395.5,
"r_x2": 479.4,
"r_y2": 389.2,
"r_x3": 476.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "7",
"orig": "7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 214,
"label": "text",
"bbox": {
"l": 489.2,
"t": 389.2,
"r": 492.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.2,
"r_y0": 395.5,
"r_x1": 492.3,
"r_y1": 395.5,
"r_x2": 492.3,
"r_y2": 389.2,
"r_x3": 489.2,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 215,
"label": "text",
"bbox": {
"l": 502.1,
"t": 389.2,
"r": 505.3,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.1,
"r_y0": 395.5,
"r_x1": 505.3,
"r_y1": 395.5,
"r_x2": 505.3,
"r_y2": 389.2,
"r_x3": 502.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 216,
"label": "text",
"bbox": {
"l": 515.1,
"t": 389.2,
"r": 521.4,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 515.1,
"r_y0": 395.5,
"r_x1": 521.4,
"r_y1": 395.5,
"r_x2": 521.4,
"r_y2": 389.2,
"r_x3": 515.1,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 217,
"label": "text",
"bbox": {
"l": 528.0,
"t": 389.2,
"r": 534.1,
"b": 395.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 528.0,
"r_y0": 395.5,
"r_x1": 534.1,
"r_y1": 395.5,
"r_x2": 534.1,
"r_y2": 389.2,
"r_x3": 528.0,
"r_y3": 389.2,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 218,
"label": "text",
"bbox": {
"l": 385.3,
"t": 399.0,
"r": 391.6,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.3,
"r_y0": 405.3,
"r_x1": 391.6,
"r_y1": 405.3,
"r_x2": 391.6,
"r_y2": 399.0,
"r_x3": 385.3,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 219,
"label": "text",
"bbox": {
"l": 398.5,
"t": 399.0,
"r": 404.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 398.5,
"r_y0": 405.3,
"r_x1": 404.8,
"r_y1": 405.3,
"r_x2": 404.8,
"r_y2": 399.0,
"r_x3": 398.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 220,
"label": "text",
"bbox": {
"l": 411.5,
"t": 399.0,
"r": 417.8,
"b": 405.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 411.5,
"r_y0": 405.3,
"r_x1": 417.8,
"r_y1": 405.3,
"r_x2": 417.8,
"r_y2": 399.0,
"r_x3": 411.5,
"r_y3": 399.0,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 221,
"label": "text",
"bbox": {
"l": 424.4,
"t": 406.8,
"r": 430.7,
"b": 413.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 424.4,
"r_y0": 413.1,
"r_x1": 430.7,
"r_y1": 413.1,
"r_x2": 430.7,
"r_y2": 406.8,
"r_x3": 424.4,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 222,
"label": "text",
"bbox": {
"l": 502.9,
"t": 411.0,
"r": 509.2,
"b": 417.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 502.9,
"r_y0": 417.3,
"r_x1": 509.2,
"r_y1": 417.3,
"r_x2": 509.2,
"r_y2": 411.0,
"r_x3": 502.9,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "29",
"orig": "29",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 223,
"label": "text",
"bbox": {
"l": 384.4,
"t": 381.8,
"r": 431.0,
"b": 386.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 384.4,
"r_y0": 386.4,
"r_x1": 431.0,
"r_y1": 386.4,
"r_x2": 431.0,
"r_y2": 381.8,
"r_x3": 384.4,
"r_y3": 381.8,
"coord_origin": "TOPLEFT"
},
"text": "Predicted Structure",
"orig": "Predicted Structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 5,
"page_no": 7,
"cluster": {
"id": 5,
"label": "caption",
"bbox": {
"l": 62.6,
"t": 458.7,
"r": 532.6,
"b": 467.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.6,
"r_y0": 467.6,
"r_x1": 532.6,
"r_y1": 467.6,
"r_x2": 532.6,
"r_y2": 458.7,
"r_x3": 62.6,
"r_y3": 458.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"orig": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."
},
{
"label": "section_header",
"id": 2,
"page_no": 7,
"cluster": {
"id": 2,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 491.4,
"r": 163.8,
"b": 501.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 501.2,
"r_x1": 64.4,
"r_y1": 501.2,
"r_x2": 64.4,
"r_y2": 491.4,
"r_x3": 50.1,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "5.5.",
"orig": "5.5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.0,
"r_y0": 501.2,
"r_x1": 163.8,
"r_y1": 501.2,
"r_x2": 163.8,
"r_y2": 491.4,
"r_x3": 74.0,
"r_y3": 491.4,
"coord_origin": "TOPLEFT"
},
"text": "Qualitative Analysis",
"orig": "Qualitative Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5.5. Qualitative Analysis"
},
{
"label": "text",
"id": 1,
"page_no": 7,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 536.9,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 545.8,
"r_x1": 286.4,
"r_y1": 545.8,
"r_x2": 286.4,
"r_y2": 536.9,
"r_x3": 62.1,
"r_y3": 536.9,
"coord_origin": "TOPLEFT"
},
"text": "We showcase several visualizations for the different",
"orig": "We showcase several visualizations for the different",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 557.7,
"r_x1": 211.2,
"r_y1": 557.7,
"r_x2": 211.2,
"r_y2": 548.8,
"r_x3": 50.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "components of our network on various",
"orig": "components of our network on various",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 215.1,
"r_y0": 557.5,
"r_x1": 259.2,
"r_y1": 557.5,
"r_x2": 259.2,
"r_y2": 548.9,
"r_x3": 215.1,
"r_y3": 548.9,
"coord_origin": "TOPLEFT"
},
"text": "\u201ccomplex\u201d",
"orig": "\u201ccomplex\u201d",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.1,
"r_y0": 557.7,
"r_x1": 286.4,
"r_y1": 557.7,
"r_x2": 286.4,
"r_y2": 548.8,
"r_x3": 263.1,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "tables",
"orig": "tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 569.7,
"r_x1": 286.4,
"r_y1": 569.7,
"r_x2": 286.4,
"r_y2": 560.8,
"r_x3": 50.1,
"r_y3": 560.8,
"coord_origin": "TOPLEFT"
},
"text": "within datasets presented in this work in Fig. 5 and Fig. 6",
"orig": "within datasets presented in this work in Fig. 5 and Fig. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 581.6,
"r_x1": 286.4,
"r_y1": 581.6,
"r_x2": 286.4,
"r_y2": 572.7,
"r_x3": 50.1,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "As it is shown, our model is able to predict bounding boxes",
"orig": "As it is shown, our model is able to predict bounding boxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 593.6,
"r_x1": 286.4,
"r_y1": 593.6,
"r_x2": 286.4,
"r_y2": 584.7,
"r_x3": 50.1,
"r_y3": 584.7,
"coord_origin": "TOPLEFT"
},
"text": "for all table cells, even for the empty ones. Additionally,",
"orig": "for all table cells, even for the empty ones. Additionally,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 605.6,
"r_x1": 286.4,
"r_y1": 605.6,
"r_x2": 286.4,
"r_y2": 596.6,
"r_x3": 50.1,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "our post-processing techniques can extract the cell content",
"orig": "our post-processing techniques can extract the cell content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 617.5,
"r_x1": 286.4,
"r_y1": 617.5,
"r_x2": 286.4,
"r_y2": 608.6,
"r_x3": 50.1,
"r_y3": 608.6,
"coord_origin": "TOPLEFT"
},
"text": "by matching the predicted bounding boxes to the PDF cells",
"orig": "by matching the predicted bounding boxes to the PDF cells",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 629.5,
"r_x1": 286.4,
"r_y1": 629.5,
"r_x2": 286.4,
"r_y2": 620.6,
"r_x3": 50.1,
"r_y3": 620.6,
"coord_origin": "TOPLEFT"
},
"text": "based on their overlap and spatial proximity. The left part",
"orig": "based on their overlap and spatial proximity. The left part",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 641.4,
"r_x1": 286.4,
"r_y1": 641.4,
"r_x2": 286.4,
"r_y2": 632.5,
"r_x3": 50.1,
"r_y3": 632.5,
"coord_origin": "TOPLEFT"
},
"text": "of Fig. 5 demonstrates also the adaptability of our method",
"orig": "of Fig. 5 demonstrates also the adaptability of our method",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 653.4,
"r_x1": 286.4,
"r_y1": 653.4,
"r_x2": 286.4,
"r_y2": 644.5,
"r_x3": 50.1,
"r_y3": 644.5,
"coord_origin": "TOPLEFT"
},
"text": "to any language, as it can successfully extract Japanese",
"orig": "to any language, as it can successfully extract Japanese",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 665.3,
"r_x1": 286.4,
"r_y1": 665.3,
"r_x2": 286.4,
"r_y2": 656.4,
"r_x3": 50.1,
"r_y3": 656.4,
"coord_origin": "TOPLEFT"
},
"text": "text, although the training set contains only English content.",
"orig": "text, although the training set contains only English content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.3,
"r_x1": 286.4,
"r_y1": 677.3,
"r_x2": 286.4,
"r_y2": 668.4,
"r_x3": 50.1,
"r_y3": 668.4,
"coord_origin": "TOPLEFT"
},
"text": "We provide more visualizations including the intermediate",
"orig": "We provide more visualizations including the intermediate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 689.2,
"r_x1": 286.4,
"r_y1": 689.2,
"r_x2": 286.4,
"r_y2": 680.3,
"r_x3": 50.1,
"r_y3": 680.3,
"coord_origin": "TOPLEFT"
},
"text": "steps in the supplementary material. Overall these illustra-",
"orig": "steps in the supplementary material. Overall these illustra-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 50.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "tions justify the versatility of our method across a diverse",
"orig": "tions justify the versatility of our method across a diverse",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 226.9,
"r_y1": 713.2,
"r_x2": 226.9,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "range of table appearances and content type.",
"orig": "range of table appearances and content type.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We showcase several visualizations for the different components of our network on various \"complex\" tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."
},
{
"label": "section_header",
"id": 4,
"page_no": 7,
"cluster": {
"id": 4,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 490.7,
"r": 460.8,
"b": 501.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 201,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 501.5,
"r_x1": 316.1,
"r_y1": 501.5,
"r_x2": 316.1,
"r_y2": 490.7,
"r_x3": 308.9,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 202,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 325.7,
"r_y0": 501.5,
"r_x1": 460.8,
"r_y1": 501.5,
"r_x2": 460.8,
"r_y2": 490.7,
"r_x3": 325.7,
"r_y3": 490.7,
"coord_origin": "TOPLEFT"
},
"text": "Future Work & Conclusion",
"orig": "Future Work & Conclusion",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Future Work & Conclusion"
},
{
"label": "text",
"id": 0,
"page_no": 7,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 308.9,
"t": 512.9,
"r": 545.1,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 203,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 521.8,
"r_x1": 545.1,
"r_y1": 521.8,
"r_x2": 545.1,
"r_y2": 512.9,
"r_x3": 320.8,
"r_y3": 512.9,
"coord_origin": "TOPLEFT"
},
"text": "In this paper, we presented TableFormer an end-to-end",
"orig": "In this paper, we presented TableFormer an end-to-end",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 204,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 533.8,
"r_x1": 545.1,
"r_y1": 533.8,
"r_x2": 545.1,
"r_y2": 524.8,
"r_x3": 308.9,
"r_y3": 524.8,
"coord_origin": "TOPLEFT"
},
"text": "transformer based approach to predict table structures and",
"orig": "transformer based approach to predict table structures and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 205,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 545.7,
"r_x1": 545.1,
"r_y1": 545.7,
"r_x2": 545.1,
"r_y2": 536.8,
"r_x3": 308.9,
"r_y3": 536.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes of cells from an image. This approach en-",
"orig": "bounding boxes of cells from an image. This approach en-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 206,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 557.7,
"r_x1": 545.1,
"r_y1": 557.7,
"r_x2": 545.1,
"r_y2": 548.8,
"r_x3": 308.9,
"r_y3": 548.8,
"coord_origin": "TOPLEFT"
},
"text": "ables us to recreate the table structure, and extract the cell",
"orig": "ables us to recreate the table structure, and extract the cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 207,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.6,
"r_x1": 545.1,
"r_y1": 569.6,
"r_x2": 545.1,
"r_y2": 560.7,
"r_x3": 308.9,
"r_y3": 560.7,
"coord_origin": "TOPLEFT"
},
"text": "content from PDF or OCR by using bounding boxes. Ad-",
"orig": "content from PDF or OCR by using bounding boxes. Ad-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 208,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 581.6,
"r_x1": 545.1,
"r_y1": 581.6,
"r_x2": 545.1,
"r_y2": 572.7,
"r_x3": 308.9,
"r_y3": 572.7,
"coord_origin": "TOPLEFT"
},
"text": "ditionally, it provides the versatility required in real-world",
"orig": "ditionally, it provides the versatility required in real-world",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 209,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 593.5,
"r_x1": 545.1,
"r_y1": 593.5,
"r_x2": 545.1,
"r_y2": 584.6,
"r_x3": 308.9,
"r_y3": 584.6,
"coord_origin": "TOPLEFT"
},
"text": "scenarios when dealing with various types of PDF docu-",
"orig": "scenarios when dealing with various types of PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 210,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 605.5,
"r_x1": 400.5,
"r_y1": 605.5,
"r_x2": 400.5,
"r_y2": 596.6,
"r_x3": 308.9,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "ments, and languages.",
"orig": "ments, and languages.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 211,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 408.4,
"r_y0": 605.5,
"r_x1": 545.1,
"r_y1": 605.5,
"r_x2": 545.1,
"r_y2": 596.6,
"r_x3": 408.4,
"r_y3": 596.6,
"coord_origin": "TOPLEFT"
},
"text": "Furthermore, our method outper-",
"orig": "Furthermore, our method outper-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 212,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 617.4,
"r_x1": 545.1,
"r_y1": 617.4,
"r_x2": 545.1,
"r_y2": 608.5,
"r_x3": 308.9,
"r_y3": 608.5,
"coord_origin": "TOPLEFT"
},
"text": "forms all state-of-the-arts with a wide margin. Finally, we",
"orig": "forms all state-of-the-arts with a wide margin. Finally, we",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 213,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 629.4,
"r_x1": 545.1,
"r_y1": 629.4,
"r_x2": 545.1,
"r_y2": 620.5,
"r_x3": 308.9,
"r_y3": 620.5,
"coord_origin": "TOPLEFT"
},
"text": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"orig": "introduce \u201cSynthTabNet\u201d a challenging synthetically gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 214,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 641.4,
"r_x1": 545.1,
"r_y1": 641.4,
"r_x2": 545.1,
"r_y2": 632.4,
"r_x3": 308.9,
"r_y3": 632.4,
"coord_origin": "TOPLEFT"
},
"text": "erated dataset that reinforces missing characteristics from",
"orig": "erated dataset that reinforces missing characteristics from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 215,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 653.3,
"r_x1": 365.9,
"r_y1": 653.3,
"r_x2": 365.9,
"r_y2": 644.4,
"r_x3": 308.9,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "other datasets.",
"orig": "other datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce \"SynthTabNet\" a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."
},
{
"label": "section_header",
"id": 3,
"page_no": 7,
"cluster": {
"id": 3,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 672.1,
"r": 364.4,
"b": 682.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 216,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 682.8,
"r_x1": 364.4,
"r_y1": 682.8,
"r_x2": 364.4,
"r_y2": 672.1,
"r_x3": 308.9,
"r_y3": 672.1,
"coord_origin": "TOPLEFT"
},
"text": "References",
"orig": "References",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "References"
},
{
"label": "list_item",
"id": 10,
"page_no": 7,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 313.3,
"t": 694.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 217,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 313.3,
"r_y0": 702.0,
"r_x1": 323.8,
"r_y1": 702.0,
"r_x2": 323.8,
"r_y2": 694.0,
"r_x3": 313.3,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[1]",
"orig": "[1]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 218,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 326.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 219,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 545.1,
"r_y1": 712.9,
"r_x2": 545.1,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"
},
{
"label": "picture",
"id": 15,
"page_no": 7,
"cluster": {
"id": 15,
"label": "picture",
"bbox": {
"l": 305.6,
"t": 98.7,
"r": 554.8,
"b": 180.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 14,
"page_no": 7,
"cluster": {
"id": 14,
"label": "picture",
"bbox": {
"l": 50.0,
"t": 103.7,
"r": 301.6,
"b": 187.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 9,
"page_no": 7,
"cluster": {
"id": 9,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 220,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "8",
"orig": "8",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8"
}
]
}
},
{
"page_no": 8,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 70.0,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 286.4,
"r_y1": 94.9,
"r_x2": 286.4,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 105.8,
"r_x1": 85.7,
"r_y1": 105.8,
"r_x2": 85.7,
"r_y2": 97.8,
"r_x3": 70.0,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.9,
"r_y0": 105.6,
"r_x1": 199.9,
"r_y1": 105.6,
"r_x2": 199.9,
"r_y2": 97.9,
"r_x3": 87.9,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.9,
"r_y0": 105.8,
"r_x1": 286.4,
"r_y1": 105.8,
"r_x2": 286.4,
"r_y2": 97.8,
"r_x3": 199.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 116.8,
"r_x1": 221.9,
"r_y1": 116.8,
"r_x2": 221.9,
"r_y2": 108.8,
"r_x3": 70.0,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.0,
"r_x1": 65.2,
"r_y1": 128.0,
"r_x2": 65.2,
"r_y2": 120.0,
"r_x3": 54.6,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 128.0,
"r_x1": 286.4,
"r_y1": 128.0,
"r_x2": 286.4,
"r_y2": 120.0,
"r_x3": 67.5,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.0,
"r_x1": 179.7,
"r_y1": 139.0,
"r_x2": 179.7,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 139.0,
"r_x1": 286.4,
"r_y1": 139.0,
"r_x2": 286.4,
"r_y2": 131.0,
"r_x3": 185.6,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 150.0,
"r_x1": 113.1,
"r_y1": 150.0,
"r_x2": 113.1,
"r_y2": 141.9,
"r_x3": 70.0,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.3,
"r_y0": 149.8,
"r_x1": 235.3,
"r_y1": 149.8,
"r_x2": 235.3,
"r_y2": 142.0,
"r_x3": 116.3,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.3,
"r_y0": 150.0,
"r_x1": 267.7,
"r_y1": 150.0,
"r_x2": 267.7,
"r_y2": 141.9,
"r_x3": 235.3,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.2,
"r_x1": 65.1,
"r_y1": 161.2,
"r_x2": 65.1,
"r_y2": 153.2,
"r_x3": 54.6,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 161.2,
"r_x1": 218.8,
"r_y1": 161.2,
"r_x2": 218.8,
"r_y2": 153.2,
"r_x3": 67.4,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.0,
"r_y0": 161.0,
"r_x1": 286.4,
"r_y1": 161.0,
"r_x2": 286.4,
"r_y2": 153.3,
"r_x3": 221.0,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 172.0,
"r_x1": 125.3,
"r_y1": 172.0,
"r_x2": 125.3,
"r_y2": 164.3,
"r_x3": 70.0,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 172.2,
"r_x1": 286.4,
"r_y1": 172.2,
"r_x2": 286.4,
"r_y2": 164.2,
"r_x3": 125.3,
"r_y3": 164.2,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.2,
"r_x1": 97.9,
"r_y1": 183.2,
"r_x2": 97.9,
"r_y2": 175.1,
"r_x3": 70.0,
"r_y3": 175.1,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 194.4,
"r_x1": 65.8,
"r_y1": 194.4,
"r_x2": 65.8,
"r_y2": 186.4,
"r_x3": 54.6,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.2,
"r_y0": 194.4,
"r_x1": 286.4,
"r_y1": 194.4,
"r_x2": 286.4,
"r_y2": 186.4,
"r_x3": 68.2,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.4,
"r_x1": 286.4,
"r_y1": 205.4,
"r_x2": 286.4,
"r_y2": 197.4,
"r_x3": 70.0,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 216.3,
"r_x1": 286.4,
"r_y1": 216.3,
"r_x2": 286.4,
"r_y2": 208.3,
"r_x3": 70.0,
"r_y3": 208.3,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.3,
"r_x1": 245.8,
"r_y1": 227.3,
"r_x2": 245.8,
"r_y2": 219.3,
"r_x3": 70.0,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 238.6,
"r_x1": 65.4,
"r_y1": 238.6,
"r_x2": 65.4,
"r_y2": 230.6,
"r_x3": 54.6,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 238.6,
"r_x1": 286.4,
"r_y1": 238.6,
"r_x2": 286.4,
"r_y2": 230.6,
"r_x3": 67.7,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.5,
"r_x1": 286.4,
"r_y1": 249.5,
"r_x2": 286.4,
"r_y2": 241.5,
"r_x3": 70.0,
"r_y3": 241.5,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.5,
"r_x1": 108.4,
"r_y1": 260.5,
"r_x2": 108.4,
"r_y2": 252.5,
"r_x3": 70.0,
"r_y3": 252.5,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.6,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.6,
"r_x3": 110.6,
"r_y3": 252.6,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.2,
"r_x1": 140.6,
"r_y1": 271.2,
"r_x2": 140.6,
"r_y2": 263.5,
"r_x3": 70.0,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.6,
"r_y0": 271.5,
"r_x1": 266.5,
"r_y1": 271.5,
"r_x2": 266.5,
"r_y2": 263.4,
"r_x3": 140.6,
"r_y3": 263.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 282.7,
"r_x1": 64.8,
"r_y1": 282.7,
"r_x2": 64.8,
"r_y2": 274.7,
"r_x3": 54.6,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.0,
"r_y0": 282.7,
"r_x1": 286.4,
"r_y1": 282.7,
"r_x2": 286.4,
"r_y2": 274.7,
"r_x3": 67.0,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.7,
"r_x1": 179.6,
"r_y1": 293.7,
"r_x2": 179.6,
"r_y2": 285.7,
"r_x3": 70.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 293.7,
"r_x1": 194.5,
"r_y1": 293.7,
"r_x2": 194.5,
"r_y2": 285.7,
"r_x3": 187.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.0,
"r_y0": 293.5,
"r_x1": 286.4,
"r_y1": 293.5,
"r_x2": 286.4,
"r_y2": 285.7,
"r_x3": 198.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.4,
"r_x1": 260.2,
"r_y1": 304.4,
"r_x2": 260.2,
"r_y2": 296.7,
"r_x3": 70.0,
"r_y3": 296.7,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.6,
"r_x1": 286.4,
"r_y1": 304.6,
"r_x2": 286.4,
"r_y2": 296.6,
"r_x3": 260.2,
"r_y3": 296.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.6,
"r_x1": 142.7,
"r_y1": 315.6,
"r_x2": 142.7,
"r_y2": 307.6,
"r_x3": 70.0,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 326.9,
"r_x1": 65.6,
"r_y1": 326.9,
"r_x2": 65.6,
"r_y2": 318.9,
"r_x3": 54.6,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 326.9,
"r_x1": 199.5,
"r_y1": 326.9,
"r_x2": 199.5,
"r_y2": 318.9,
"r_x3": 68.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.0,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.9,
"r_x3": 207.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 337.8,
"r_x1": 176.3,
"r_y1": 337.8,
"r_x2": 176.3,
"r_y2": 329.8,
"r_x3": 70.0,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.8,
"r_x1": 190.1,
"r_y1": 337.8,
"r_x2": 190.1,
"r_y2": 329.8,
"r_x3": 182.6,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.3,
"r_y0": 337.6,
"r_x1": 286.4,
"r_y1": 337.6,
"r_x2": 286.4,
"r_y2": 329.9,
"r_x3": 193.3,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.6,
"r_x1": 206.3,
"r_y1": 348.6,
"r_x2": 206.3,
"r_y2": 340.9,
"r_x3": 70.0,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 348.8,
"r_x1": 274.8,
"r_y1": 348.8,
"r_x2": 274.8,
"r_y2": 340.8,
"r_x3": 206.3,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 360.1,
"r_x1": 65.0,
"r_y1": 360.1,
"r_x2": 65.0,
"r_y2": 352.0,
"r_x3": 54.6,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.3,
"r_y0": 360.1,
"r_x1": 286.4,
"r_y1": 360.1,
"r_x2": 286.4,
"r_y2": 352.0,
"r_x3": 67.3,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 371.0,
"r_x1": 234.1,
"r_y1": 371.0,
"r_x2": 234.1,
"r_y2": 363.0,
"r_x3": 70.0,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.1,
"r_y0": 371.0,
"r_x1": 286.4,
"r_y1": 371.0,
"r_x2": 286.4,
"r_y2": 363.0,
"r_x3": 240.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 382.0,
"r_x1": 286.4,
"r_y1": 382.0,
"r_x2": 286.4,
"r_y2": 374.0,
"r_x3": 70.0,
"r_y3": 374.0,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 70.0,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 114.6,
"r_y1": 403.9,
"r_x2": 114.6,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.7,
"r_x1": 186.7,
"r_y1": 403.7,
"r_x2": 186.7,
"r_y2": 396.0,
"r_x3": 117.8,
"r_y3": 396.0,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.7,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.9,
"r_x3": 186.7,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.2,
"r_x1": 65.3,
"r_y1": 415.2,
"r_x2": 65.3,
"r_y2": 407.2,
"r_x3": 54.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.6,
"r_y0": 415.2,
"r_x1": 286.4,
"r_y1": 415.2,
"r_x2": 286.4,
"r_y2": 407.2,
"r_x3": 67.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 426.1,
"r_x1": 147.1,
"r_y1": 426.1,
"r_x2": 147.1,
"r_y2": 418.1,
"r_x3": 70.0,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.2,
"r_y0": 425.9,
"r_x1": 286.4,
"r_y1": 425.9,
"r_x2": 286.4,
"r_y2": 418.2,
"r_x3": 149.2,
"r_y3": 418.2,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.9,
"r_x1": 213.5,
"r_y1": 436.9,
"r_x2": 213.5,
"r_y2": 429.2,
"r_x3": 70.0,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.5,
"r_y0": 437.1,
"r_x1": 261.0,
"r_y1": 437.1,
"r_x2": 261.0,
"r_y2": 429.1,
"r_x3": 213.5,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.4,
"r_x1": 65.4,
"r_y1": 448.4,
"r_x2": 65.4,
"r_y2": 440.3,
"r_x3": 50.1,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 448.4,
"r_x1": 286.4,
"r_y1": 448.4,
"r_x2": 286.4,
"r_y2": 440.3,
"r_x3": 67.7,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 459.3,
"r_x1": 202.7,
"r_y1": 459.3,
"r_x2": 202.7,
"r_y2": 451.3,
"r_x3": 70.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.3,
"r_x1": 286.4,
"r_y1": 459.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 470.3,
"r_x1": 286.4,
"r_y1": 470.3,
"r_x2": 286.4,
"r_y2": 462.3,
"r_x3": 70.0,
"r_y3": 462.3,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.2,
"r_x1": 141.9,
"r_y1": 481.2,
"r_x2": 141.9,
"r_y2": 473.2,
"r_x3": 70.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.0,
"r_x1": 166.0,
"r_y1": 481.0,
"r_x2": 166.0,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.0,
"r_y0": 481.2,
"r_x1": 259.9,
"r_y1": 481.2,
"r_x2": 259.9,
"r_y2": 473.2,
"r_x3": 166.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.5,
"r_x1": 66.0,
"r_y1": 492.5,
"r_x2": 66.0,
"r_y2": 484.5,
"r_x3": 50.1,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 492.5,
"r_x1": 286.4,
"r_y1": 492.5,
"r_x2": 286.4,
"r_y2": 484.5,
"r_x3": 68.4,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 503.5,
"r_x1": 286.4,
"r_y1": 503.5,
"r_x2": 286.4,
"r_y2": 495.4,
"r_x3": 70.0,
"r_y3": 495.4,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 514.2,
"r_x1": 227.4,
"r_y1": 514.2,
"r_x2": 227.4,
"r_y2": 506.5,
"r_x3": 70.0,
"r_y3": 506.5,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.4,
"r_y0": 514.4,
"r_x1": 286.4,
"r_y1": 514.4,
"r_x2": 286.4,
"r_y2": 506.4,
"r_x3": 227.4,
"r_y3": 506.4,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.4,
"r_x1": 286.4,
"r_y1": 525.4,
"r_x2": 286.4,
"r_y2": 517.4,
"r_x3": 70.0,
"r_y3": 517.4,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 536.3,
"r_x1": 112.4,
"r_y1": 536.3,
"r_x2": 112.4,
"r_y2": 528.3,
"r_x3": 70.0,
"r_y3": 528.3,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 547.6,
"r_x1": 65.5,
"r_y1": 547.6,
"r_x2": 65.5,
"r_y2": 539.6,
"r_x3": 50.1,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 547.6,
"r_x1": 286.4,
"r_y1": 547.6,
"r_x2": 286.4,
"r_y2": 539.6,
"r_x3": 67.8,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 558.6,
"r_x1": 136.3,
"r_y1": 558.6,
"r_x2": 136.3,
"r_y2": 550.6,
"r_x3": 70.0,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.6,
"r_x3": 138.8,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.3,
"r_x1": 286.4,
"r_y1": 569.3,
"r_x2": 286.4,
"r_y2": 561.6,
"r_x3": 70.0,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 74.5,
"r_y1": 580.3,
"r_x2": 74.5,
"r_y2": 572.6,
"r_x3": 70.0,
"r_y3": 572.6,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.5,
"r_y0": 580.5,
"r_x1": 286.4,
"r_y1": 580.5,
"r_x2": 286.4,
"r_y2": 572.5,
"r_x3": 74.5,
"r_y3": 572.5,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.4,
"r_x1": 90.4,
"r_y1": 591.4,
"r_x2": 90.4,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.7,
"r_x1": 66.3,
"r_y1": 602.7,
"r_x2": 66.3,
"r_y2": 594.7,
"r_x3": 50.1,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.7,
"r_x1": 286.4,
"r_y1": 602.7,
"r_x2": 286.4,
"r_y2": 594.7,
"r_x3": 68.7,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.7,
"r_x1": 286.4,
"r_y1": 613.7,
"r_x2": 286.4,
"r_y2": 605.7,
"r_x3": 70.0,
"r_y3": 605.7,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.6,
"r_x1": 286.4,
"r_y1": 624.6,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.9,
"r_y0": 635.4,
"r_x1": 286.4,
"r_y1": 635.4,
"r_x2": 286.4,
"r_y2": 627.7,
"r_x3": 79.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 646.4,
"r_x1": 140.7,
"r_y1": 646.4,
"r_x2": 140.7,
"r_y2": 638.6,
"r_x3": 70.0,
"r_y3": 638.6,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.7,
"r_y0": 646.6,
"r_x1": 264.4,
"r_y1": 646.6,
"r_x2": 264.4,
"r_y2": 638.5,
"r_x3": 140.7,
"r_y3": 638.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 657.8,
"r_x1": 66.5,
"r_y1": 657.8,
"r_x2": 66.5,
"r_y2": 649.8,
"r_x3": 50.1,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 69.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.8,
"r_x1": 93.2,
"r_y1": 668.8,
"r_x2": 93.2,
"r_y2": 660.8,
"r_x3": 70.0,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.8,
"r_x1": 286.4,
"r_y1": 668.8,
"r_x2": 286.4,
"r_y2": 660.8,
"r_x3": 102.2,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 172.0,
"r_y1": 679.7,
"r_x2": 172.0,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 691.0,
"r_x1": 65.5,
"r_y1": 691.0,
"r_x2": 65.5,
"r_y2": 683.0,
"r_x3": 50.1,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 691.0,
"r_x1": 286.4,
"r_y1": 691.0,
"r_x2": 286.4,
"r_y2": 683.0,
"r_x3": 67.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 702.0,
"r_x1": 102.2,
"r_y1": 702.0,
"r_x2": 102.2,
"r_y2": 694.0,
"r_x3": 70.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.5,
"r_y0": 701.8,
"r_x1": 231.5,
"r_y1": 701.8,
"r_x2": 231.5,
"r_y2": 694.0,
"r_x3": 107.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.5,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 231.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 97.9,
"r_y1": 712.9,
"r_x2": 97.9,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 83.9,
"r_x1": 324.7,
"r_y1": 83.9,
"r_x2": 324.7,
"r_y2": 75.9,
"r_x3": 308.9,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 327.1,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 545.1,
"r_y1": 94.9,
"r_x2": 545.1,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.8,
"r_x1": 391.0,
"r_y1": 105.8,
"r_x2": 391.0,
"r_y2": 97.8,
"r_x3": 328.8,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.3,
"r_y0": 105.8,
"r_x1": 435.1,
"r_y1": 105.8,
"r_x2": 435.1,
"r_y2": 97.8,
"r_x3": 400.3,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.7,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 441.7,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 440.8,
"r_y1": 116.8,
"r_x2": 440.8,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.6,
"r_y0": 116.6,
"r_x1": 545.1,
"r_y1": 116.6,
"r_x2": 545.1,
"r_y2": 108.8,
"r_x3": 446.6,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 127.5,
"r_x1": 471.1,
"r_y1": 127.5,
"r_x2": 471.1,
"r_y2": 119.8,
"r_x3": 328.8,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.1,
"r_y0": 127.7,
"r_x1": 545.1,
"r_y1": 127.7,
"r_x2": 545.1,
"r_y2": 119.7,
"r_x3": 471.1,
"r_y3": 119.7,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 138.7,
"r_x1": 356.7,
"r_y1": 138.7,
"r_x2": 356.7,
"r_y2": 130.7,
"r_x3": 328.8,
"r_y3": 130.7,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 150.1,
"r_x1": 325.2,
"r_y1": 150.1,
"r_x2": 325.2,
"r_y2": 142.1,
"r_x3": 308.9,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.1,
"r_x1": 545.1,
"r_y1": 150.1,
"r_x2": 545.1,
"r_y2": 142.1,
"r_x3": 327.7,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.1,
"r_x1": 414.4,
"r_y1": 161.1,
"r_x2": 414.4,
"r_y2": 153.1,
"r_x3": 328.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.8,
"r_y0": 161.1,
"r_x1": 545.1,
"r_y1": 161.1,
"r_x2": 545.1,
"r_y2": 153.1,
"r_x3": 421.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 172.1,
"r_x1": 493.6,
"r_y1": 172.1,
"r_x2": 493.6,
"r_y2": 164.0,
"r_x3": 328.8,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 324.3,
"r_y1": 183.5,
"r_x2": 324.3,
"r_y2": 175.5,
"r_x3": 308.9,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 175.5,
"r_x3": 326.6,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 194.5,
"r_x1": 545.1,
"r_y1": 194.5,
"r_x2": 545.1,
"r_y2": 186.4,
"r_x3": 328.8,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 205.4,
"r_x1": 545.1,
"r_y1": 205.4,
"r_x2": 545.1,
"r_y2": 197.4,
"r_x3": 328.8,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 216.4,
"r_x1": 545.1,
"r_y1": 216.4,
"r_x2": 545.1,
"r_y2": 208.4,
"r_x3": 328.8,
"r_y3": 208.4,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 227.3,
"r_x1": 479.3,
"r_y1": 227.3,
"r_x2": 479.3,
"r_y2": 219.3,
"r_x3": 328.8,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 227.1,
"r_x1": 545.1,
"r_y1": 227.1,
"r_x2": 545.1,
"r_y2": 219.4,
"r_x3": 483.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 238.1,
"r_x1": 519.4,
"r_y1": 238.1,
"r_x2": 519.4,
"r_y2": 230.4,
"r_x3": 328.8,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.1,
"r_y1": 238.3,
"r_x2": 545.1,
"r_y2": 230.3,
"r_x3": 519.4,
"r_y3": 230.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 249.3,
"r_x1": 545.1,
"r_y1": 249.3,
"r_x2": 545.1,
"r_y2": 241.2,
"r_x3": 328.8,
"r_y3": 241.2,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 260.2,
"r_x1": 333.3,
"r_y1": 260.2,
"r_x2": 333.3,
"r_y2": 252.2,
"r_x3": 328.8,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 271.7,
"r_x1": 324.3,
"r_y1": 271.7,
"r_x2": 324.3,
"r_y2": 263.6,
"r_x3": 308.9,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 271.7,
"r_x1": 545.1,
"r_y1": 271.7,
"r_x2": 545.1,
"r_y2": 263.6,
"r_x3": 326.6,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 274.6,
"r_x3": 328.8,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 293.6,
"r_x1": 545.1,
"r_y1": 293.6,
"r_x2": 545.1,
"r_y2": 285.6,
"r_x3": 328.8,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 296.5,
"r_x3": 328.8,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 315.5,
"r_x1": 352.8,
"r_y1": 315.5,
"r_x2": 352.8,
"r_y2": 307.5,
"r_x3": 328.8,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 315.3,
"r_x1": 545.1,
"r_y1": 315.3,
"r_x2": 545.1,
"r_y2": 307.6,
"r_x3": 360.2,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 326.2,
"r_x1": 371.0,
"r_y1": 326.2,
"r_x2": 371.0,
"r_y2": 318.5,
"r_x3": 328.8,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.0,
"r_y0": 326.5,
"r_x1": 502.3,
"r_y1": 326.5,
"r_x2": 502.3,
"r_y2": 318.4,
"r_x3": 371.0,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.9,
"r_x1": 323.8,
"r_y1": 337.9,
"r_x2": 323.8,
"r_y2": 329.9,
"r_x3": 308.9,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 337.9,
"r_x1": 545.1,
"r_y1": 337.9,
"r_x2": 545.1,
"r_y2": 329.9,
"r_x3": 326.1,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 348.9,
"r_x1": 545.1,
"r_y1": 348.9,
"r_x2": 545.1,
"r_y2": 340.8,
"r_x3": 328.8,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 359.8,
"r_x1": 382.8,
"r_y1": 359.8,
"r_x2": 382.8,
"r_y2": 351.8,
"r_x3": 328.8,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.5,
"r_y0": 359.6,
"r_x1": 545.1,
"r_y1": 359.6,
"r_x2": 545.1,
"r_y2": 351.9,
"r_x3": 385.5,
"r_y3": 351.9,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 370.6,
"r_x1": 443.6,
"r_y1": 370.6,
"r_x2": 443.6,
"r_y2": 362.8,
"r_x3": 328.8,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.6,
"r_y0": 370.8,
"r_x1": 534.5,
"r_y1": 370.8,
"r_x2": 534.5,
"r_y2": 362.8,
"r_x3": 443.6,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 382.2,
"r_x1": 324.6,
"r_y1": 382.2,
"r_x2": 324.6,
"r_y2": 374.2,
"r_x3": 308.9,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.0,
"r_y0": 382.2,
"r_x1": 362.7,
"r_y1": 382.2,
"r_x2": 362.7,
"r_y2": 374.2,
"r_x3": 327.0,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.7,
"r_y0": 382.2,
"r_x1": 389.6,
"r_y1": 382.2,
"r_x2": 389.6,
"r_y2": 374.2,
"r_x3": 368.7,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.6,
"r_y0": 382.2,
"r_x1": 424.6,
"r_y1": 382.2,
"r_x2": 424.6,
"r_y2": 374.2,
"r_x3": 395.6,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.5,
"r_y0": 382.2,
"r_x1": 438.0,
"r_y1": 382.2,
"r_x2": 438.0,
"r_y2": 374.2,
"r_x3": 431.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.1,
"r_y0": 382.2,
"r_x1": 488.5,
"r_y1": 382.2,
"r_x2": 488.5,
"r_y2": 374.2,
"r_x3": 444.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.5,
"r_y0": 382.2,
"r_x1": 515.4,
"r_y1": 382.2,
"r_x2": 515.4,
"r_y2": 374.2,
"r_x3": 495.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.4,
"r_y0": 382.2,
"r_x1": 545.1,
"r_y1": 382.2,
"r_x2": 545.1,
"r_y2": 374.2,
"r_x3": 521.4,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 393.2,
"r_x1": 545.1,
"r_y1": 393.2,
"r_x2": 545.1,
"r_y2": 385.2,
"r_x3": 328.8,
"r_y3": 385.2,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 404.1,
"r_x1": 545.1,
"r_y1": 404.1,
"r_x2": 545.1,
"r_y2": 396.1,
"r_x3": 328.8,
"r_y3": 396.1,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 415.1,
"r_x1": 478.0,
"r_y1": 415.1,
"r_x2": 478.0,
"r_y2": 407.1,
"r_x3": 328.8,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.1,
"r_y0": 415.1,
"r_x1": 491.5,
"r_y1": 415.1,
"r_x2": 491.5,
"r_y2": 407.1,
"r_x3": 484.1,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.7,
"r_y0": 414.9,
"r_x1": 545.1,
"r_y1": 414.9,
"r_x2": 545.1,
"r_y2": 407.2,
"r_x3": 494.7,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 425.9,
"r_x1": 545.1,
"r_y1": 425.9,
"r_x2": 545.1,
"r_y2": 418.1,
"r_x3": 328.8,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 436.8,
"r_x1": 360.8,
"r_y1": 436.8,
"r_x2": 360.8,
"r_y2": 429.1,
"r_x3": 328.8,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 437.0,
"r_x1": 475.6,
"r_y1": 437.0,
"r_x2": 475.6,
"r_y2": 429.0,
"r_x3": 360.8,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.5,
"r_x1": 324.6,
"r_y1": 448.5,
"r_x2": 324.6,
"r_y2": 440.4,
"r_x3": 308.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 448.5,
"r_x1": 545.1,
"r_y1": 448.5,
"r_x2": 545.1,
"r_y2": 440.4,
"r_x3": 326.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 459.4,
"r_x1": 545.1,
"r_y1": 459.4,
"r_x2": 545.1,
"r_y2": 451.4,
"r_x3": 328.8,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 470.4,
"r_x1": 545.1,
"r_y1": 470.4,
"r_x2": 545.1,
"r_y2": 462.4,
"r_x3": 328.8,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 481.3,
"r_x1": 545.1,
"r_y1": 481.3,
"r_x2": 545.1,
"r_y2": 473.3,
"r_x3": 328.8,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 492.3,
"r_x1": 545.1,
"r_y1": 492.3,
"r_x2": 545.1,
"r_y2": 484.3,
"r_x3": 328.8,
"r_y3": 484.3,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 503.3,
"r_x1": 545.1,
"r_y1": 503.3,
"r_x2": 545.1,
"r_y2": 495.2,
"r_x3": 328.8,
"r_y3": 495.2,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 514.2,
"r_x1": 545.1,
"r_y1": 514.2,
"r_x2": 545.1,
"r_y2": 506.2,
"r_x3": 328.8,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 525.2,
"r_x1": 545.1,
"r_y1": 525.2,
"r_x2": 545.1,
"r_y2": 517.2,
"r_x3": 328.8,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 536.1,
"r_x1": 434.6,
"r_y1": 536.1,
"r_x2": 434.6,
"r_y2": 528.1,
"r_x3": 328.8,
"r_y3": 528.1,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.9,
"r_y0": 535.9,
"r_x1": 545.1,
"r_y1": 535.9,
"r_x2": 545.1,
"r_y2": 528.2,
"r_x3": 437.9,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 546.9,
"r_x1": 425.7,
"r_y1": 546.9,
"r_x2": 425.7,
"r_y2": 539.2,
"r_x3": 328.8,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.7,
"r_y0": 547.1,
"r_x1": 545.1,
"r_y1": 547.1,
"r_x2": 545.1,
"r_y2": 539.1,
"r_x3": 425.7,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 558.1,
"r_x1": 399.7,
"r_y1": 558.1,
"r_x2": 399.7,
"r_y2": 550.0,
"r_x3": 328.8,
"r_y3": 550.0,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.5,
"r_x3": 308.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 569.5,
"r_x1": 545.1,
"r_y1": 569.5,
"r_x2": 545.1,
"r_y2": 561.5,
"r_x3": 326.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 580.5,
"r_x1": 545.1,
"r_y1": 580.5,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 328.8,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 591.4,
"r_x1": 545.1,
"r_y1": 591.4,
"r_x2": 545.1,
"r_y2": 583.4,
"r_x3": 328.8,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 602.4,
"r_x1": 431.6,
"r_y1": 602.4,
"r_x2": 431.6,
"r_y2": 594.4,
"r_x3": 328.8,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 602.2,
"r_x1": 545.1,
"r_y1": 602.2,
"r_x2": 545.1,
"r_y2": 594.4,
"r_x3": 434.7,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 613.1,
"r_x1": 545.1,
"r_y1": 613.1,
"r_x2": 545.1,
"r_y2": 605.4,
"r_x3": 328.8,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 624.1,
"r_x1": 367.8,
"r_y1": 624.1,
"r_x2": 367.8,
"r_y2": 616.4,
"r_x3": 328.8,
"r_y3": 616.4,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.3,
"r_x1": 458.7,
"r_y1": 624.3,
"r_x2": 458.7,
"r_y2": 616.3,
"r_x3": 367.8,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 635.7,
"r_x1": 324.7,
"r_y1": 635.7,
"r_x2": 324.7,
"r_y2": 627.7,
"r_x3": 308.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 635.7,
"r_x1": 545.1,
"r_y1": 635.7,
"r_x2": 545.1,
"r_y2": 627.7,
"r_x3": 327.1,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 646.7,
"r_x1": 545.1,
"r_y1": 646.7,
"r_x2": 545.1,
"r_y2": 638.7,
"r_x3": 328.8,
"r_y3": 638.7,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 657.7,
"r_x1": 336.3,
"r_y1": 657.7,
"r_x2": 336.3,
"r_y2": 649.6,
"r_x3": 328.8,
"r_y3": 649.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.4,
"r_x1": 545.1,
"r_y1": 657.4,
"r_x2": 545.1,
"r_y2": 649.7,
"r_x3": 338.1,
"r_y3": 649.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 668.4,
"r_x1": 406.3,
"r_y1": 668.4,
"r_x2": 406.3,
"r_y2": 660.7,
"r_x3": 328.8,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 668.6,
"r_x1": 521.1,
"r_y1": 668.6,
"r_x2": 521.1,
"r_y2": 660.6,
"r_x3": 406.3,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 680.1,
"r_x1": 324.7,
"r_y1": 680.1,
"r_x2": 324.7,
"r_y2": 672.0,
"r_x3": 308.9,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 680.1,
"r_x1": 545.1,
"r_y1": 680.1,
"r_x2": 545.1,
"r_y2": 672.0,
"r_x3": 327.1,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 691.0,
"r_x1": 482.8,
"r_y1": 691.0,
"r_x2": 482.8,
"r_y2": 683.0,
"r_x3": 328.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.8,
"r_y0": 691.0,
"r_x1": 545.1,
"r_y1": 691.0,
"r_x2": 545.1,
"r_y2": 683.0,
"r_x3": 488.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 328.8,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 379.2,
"r_y1": 712.9,
"r_x2": 379.2,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.6,
"r_y0": 712.7,
"r_x1": 545.1,
"r_y1": 712.7,
"r_x2": 545.1,
"r_y2": 705.0,
"r_x3": 381.6,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.73,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 70.0,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 286.4,
"r_y1": 94.9,
"r_x2": 286.4,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 105.8,
"r_x1": 85.7,
"r_y1": 105.8,
"r_x2": 85.7,
"r_y2": 97.8,
"r_x3": 70.0,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.9,
"r_y0": 105.6,
"r_x1": 199.9,
"r_y1": 105.6,
"r_x2": 199.9,
"r_y2": 97.9,
"r_x3": 87.9,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.9,
"r_y0": 105.8,
"r_x1": 286.4,
"r_y1": 105.8,
"r_x2": 286.4,
"r_y2": 97.8,
"r_x3": 199.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 116.8,
"r_x1": 221.9,
"r_y1": 116.8,
"r_x2": 221.9,
"r_y2": 108.8,
"r_x3": 70.0,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.0,
"r": 286.4,
"b": 150.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.0,
"r_x1": 65.2,
"r_y1": 128.0,
"r_x2": 65.2,
"r_y2": 120.0,
"r_x3": 54.6,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 128.0,
"r_x1": 286.4,
"r_y1": 128.0,
"r_x2": 286.4,
"r_y2": 120.0,
"r_x3": 67.5,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.0,
"r_x1": 179.7,
"r_y1": 139.0,
"r_x2": 179.7,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 139.0,
"r_x1": 286.4,
"r_y1": 139.0,
"r_x2": 286.4,
"r_y2": 131.0,
"r_x3": 185.6,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 150.0,
"r_x1": 113.1,
"r_y1": 150.0,
"r_x2": 113.1,
"r_y2": 141.9,
"r_x3": 70.0,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.3,
"r_y0": 149.8,
"r_x1": 235.3,
"r_y1": 149.8,
"r_x2": 235.3,
"r_y2": 142.0,
"r_x3": 116.3,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.3,
"r_y0": 150.0,
"r_x1": 267.7,
"r_y1": 150.0,
"r_x2": 267.7,
"r_y2": 141.9,
"r_x3": 235.3,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.2,
"r": 286.4,
"b": 183.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.2,
"r_x1": 65.1,
"r_y1": 161.2,
"r_x2": 65.1,
"r_y2": 153.2,
"r_x3": 54.6,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 161.2,
"r_x1": 218.8,
"r_y1": 161.2,
"r_x2": 218.8,
"r_y2": 153.2,
"r_x3": 67.4,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.0,
"r_y0": 161.0,
"r_x1": 286.4,
"r_y1": 161.0,
"r_x2": 286.4,
"r_y2": 153.3,
"r_x3": 221.0,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 172.0,
"r_x1": 125.3,
"r_y1": 172.0,
"r_x2": 125.3,
"r_y2": 164.3,
"r_x3": 70.0,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 172.2,
"r_x1": 286.4,
"r_y1": 172.2,
"r_x2": 286.4,
"r_y2": 164.2,
"r_x3": 125.3,
"r_y3": 164.2,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.2,
"r_x1": 97.9,
"r_y1": 183.2,
"r_x2": 97.9,
"r_y2": 175.1,
"r_x3": 70.0,
"r_y3": 175.1,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 186.4,
"r": 286.4,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 194.4,
"r_x1": 65.8,
"r_y1": 194.4,
"r_x2": 65.8,
"r_y2": 186.4,
"r_x3": 54.6,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.2,
"r_y0": 194.4,
"r_x1": 286.4,
"r_y1": 194.4,
"r_x2": 286.4,
"r_y2": 186.4,
"r_x3": 68.2,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.4,
"r_x1": 286.4,
"r_y1": 205.4,
"r_x2": 286.4,
"r_y2": 197.4,
"r_x3": 70.0,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 216.3,
"r_x1": 286.4,
"r_y1": 216.3,
"r_x2": 286.4,
"r_y2": 208.3,
"r_x3": 70.0,
"r_y3": 208.3,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.3,
"r_x1": 245.8,
"r_y1": 227.3,
"r_x2": 245.8,
"r_y2": 219.3,
"r_x3": 70.0,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 230.6,
"r": 286.4,
"b": 271.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 238.6,
"r_x1": 65.4,
"r_y1": 238.6,
"r_x2": 65.4,
"r_y2": 230.6,
"r_x3": 54.6,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 238.6,
"r_x1": 286.4,
"r_y1": 238.6,
"r_x2": 286.4,
"r_y2": 230.6,
"r_x3": 67.7,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.5,
"r_x1": 286.4,
"r_y1": 249.5,
"r_x2": 286.4,
"r_y2": 241.5,
"r_x3": 70.0,
"r_y3": 241.5,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.5,
"r_x1": 108.4,
"r_y1": 260.5,
"r_x2": 108.4,
"r_y2": 252.5,
"r_x3": 70.0,
"r_y3": 252.5,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.6,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.6,
"r_x3": 110.6,
"r_y3": 252.6,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.2,
"r_x1": 140.6,
"r_y1": 271.2,
"r_x2": 140.6,
"r_y2": 263.5,
"r_x3": 70.0,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.6,
"r_y0": 271.5,
"r_x1": 266.5,
"r_y1": 271.5,
"r_x2": 266.5,
"r_y2": 263.4,
"r_x3": 140.6,
"r_y3": 263.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 274.7,
"r": 286.4,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 282.7,
"r_x1": 64.8,
"r_y1": 282.7,
"r_x2": 64.8,
"r_y2": 274.7,
"r_x3": 54.6,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.0,
"r_y0": 282.7,
"r_x1": 286.4,
"r_y1": 282.7,
"r_x2": 286.4,
"r_y2": 274.7,
"r_x3": 67.0,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.7,
"r_x1": 179.6,
"r_y1": 293.7,
"r_x2": 179.6,
"r_y2": 285.7,
"r_x3": 70.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 293.7,
"r_x1": 194.5,
"r_y1": 293.7,
"r_x2": 194.5,
"r_y2": 285.7,
"r_x3": 187.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.0,
"r_y0": 293.5,
"r_x1": 286.4,
"r_y1": 293.5,
"r_x2": 286.4,
"r_y2": 285.7,
"r_x3": 198.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.4,
"r_x1": 260.2,
"r_y1": 304.4,
"r_x2": 260.2,
"r_y2": 296.7,
"r_x3": 70.0,
"r_y3": 296.7,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.6,
"r_x1": 286.4,
"r_y1": 304.6,
"r_x2": 286.4,
"r_y2": 296.6,
"r_x3": 260.2,
"r_y3": 296.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.6,
"r_x1": 142.7,
"r_y1": 315.6,
"r_x2": 142.7,
"r_y2": 307.6,
"r_x3": 70.0,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 318.9,
"r": 286.4,
"b": 348.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 326.9,
"r_x1": 65.6,
"r_y1": 326.9,
"r_x2": 65.6,
"r_y2": 318.9,
"r_x3": 54.6,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 326.9,
"r_x1": 199.5,
"r_y1": 326.9,
"r_x2": 199.5,
"r_y2": 318.9,
"r_x3": 68.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.0,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.9,
"r_x3": 207.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 337.8,
"r_x1": 176.3,
"r_y1": 337.8,
"r_x2": 176.3,
"r_y2": 329.8,
"r_x3": 70.0,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.8,
"r_x1": 190.1,
"r_y1": 337.8,
"r_x2": 190.1,
"r_y2": 329.8,
"r_x3": 182.6,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.3,
"r_y0": 337.6,
"r_x1": 286.4,
"r_y1": 337.6,
"r_x2": 286.4,
"r_y2": 329.9,
"r_x3": 193.3,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.6,
"r_x1": 206.3,
"r_y1": 348.6,
"r_x2": 206.3,
"r_y2": 340.9,
"r_x3": 70.0,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 348.8,
"r_x1": 274.8,
"r_y1": 348.8,
"r_x2": 274.8,
"r_y2": 340.8,
"r_x3": 206.3,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 352.0,
"r": 286.4,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 360.1,
"r_x1": 65.0,
"r_y1": 360.1,
"r_x2": 65.0,
"r_y2": 352.0,
"r_x3": 54.6,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.3,
"r_y0": 360.1,
"r_x1": 286.4,
"r_y1": 360.1,
"r_x2": 286.4,
"r_y2": 352.0,
"r_x3": 67.3,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 371.0,
"r_x1": 234.1,
"r_y1": 371.0,
"r_x2": 234.1,
"r_y2": 363.0,
"r_x3": 70.0,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.1,
"r_y0": 371.0,
"r_x1": 286.4,
"r_y1": 371.0,
"r_x2": 286.4,
"r_y2": 363.0,
"r_x3": 240.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 382.0,
"r_x1": 286.4,
"r_y1": 382.0,
"r_x2": 286.4,
"r_y2": 374.0,
"r_x3": 70.0,
"r_y3": 374.0,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 70.0,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 114.6,
"r_y1": 403.9,
"r_x2": 114.6,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.7,
"r_x1": 186.7,
"r_y1": 403.7,
"r_x2": 186.7,
"r_y2": 396.0,
"r_x3": 117.8,
"r_y3": 396.0,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.7,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.9,
"r_x3": 186.7,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.2,
"r": 286.4,
"b": 437.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.2,
"r_x1": 65.3,
"r_y1": 415.2,
"r_x2": 65.3,
"r_y2": 407.2,
"r_x3": 54.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.6,
"r_y0": 415.2,
"r_x1": 286.4,
"r_y1": 415.2,
"r_x2": 286.4,
"r_y2": 407.2,
"r_x3": 67.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 426.1,
"r_x1": 147.1,
"r_y1": 426.1,
"r_x2": 147.1,
"r_y2": 418.1,
"r_x3": 70.0,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.2,
"r_y0": 425.9,
"r_x1": 286.4,
"r_y1": 425.9,
"r_x2": 286.4,
"r_y2": 418.2,
"r_x3": 149.2,
"r_y3": 418.2,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.9,
"r_x1": 213.5,
"r_y1": 436.9,
"r_x2": 213.5,
"r_y2": 429.2,
"r_x3": 70.0,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.5,
"r_y0": 437.1,
"r_x1": 261.0,
"r_y1": 437.1,
"r_x2": 261.0,
"r_y2": 429.1,
"r_x3": 213.5,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 440.3,
"r": 286.4,
"b": 481.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.4,
"r_x1": 65.4,
"r_y1": 448.4,
"r_x2": 65.4,
"r_y2": 440.3,
"r_x3": 50.1,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 448.4,
"r_x1": 286.4,
"r_y1": 448.4,
"r_x2": 286.4,
"r_y2": 440.3,
"r_x3": 67.7,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 459.3,
"r_x1": 202.7,
"r_y1": 459.3,
"r_x2": 202.7,
"r_y2": 451.3,
"r_x3": 70.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.3,
"r_x1": 286.4,
"r_y1": 459.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 470.3,
"r_x1": 286.4,
"r_y1": 470.3,
"r_x2": 286.4,
"r_y2": 462.3,
"r_x3": 70.0,
"r_y3": 462.3,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.2,
"r_x1": 141.9,
"r_y1": 481.2,
"r_x2": 141.9,
"r_y2": 473.2,
"r_x3": 70.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.0,
"r_x1": 166.0,
"r_y1": 481.0,
"r_x2": 166.0,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.0,
"r_y0": 481.2,
"r_x1": 259.9,
"r_y1": 481.2,
"r_x2": 259.9,
"r_y2": 473.2,
"r_x3": 166.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 484.5,
"r": 286.4,
"b": 536.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.5,
"r_x1": 66.0,
"r_y1": 492.5,
"r_x2": 66.0,
"r_y2": 484.5,
"r_x3": 50.1,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 492.5,
"r_x1": 286.4,
"r_y1": 492.5,
"r_x2": 286.4,
"r_y2": 484.5,
"r_x3": 68.4,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 503.5,
"r_x1": 286.4,
"r_y1": 503.5,
"r_x2": 286.4,
"r_y2": 495.4,
"r_x3": 70.0,
"r_y3": 495.4,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 514.2,
"r_x1": 227.4,
"r_y1": 514.2,
"r_x2": 227.4,
"r_y2": 506.5,
"r_x3": 70.0,
"r_y3": 506.5,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.4,
"r_y0": 514.4,
"r_x1": 286.4,
"r_y1": 514.4,
"r_x2": 286.4,
"r_y2": 506.4,
"r_x3": 227.4,
"r_y3": 506.4,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.4,
"r_x1": 286.4,
"r_y1": 525.4,
"r_x2": 286.4,
"r_y2": 517.4,
"r_x3": 70.0,
"r_y3": 517.4,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 536.3,
"r_x1": 112.4,
"r_y1": 536.3,
"r_x2": 112.4,
"r_y2": 528.3,
"r_x3": 70.0,
"r_y3": 528.3,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 539.6,
"r": 286.4,
"b": 591.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 547.6,
"r_x1": 65.5,
"r_y1": 547.6,
"r_x2": 65.5,
"r_y2": 539.6,
"r_x3": 50.1,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 547.6,
"r_x1": 286.4,
"r_y1": 547.6,
"r_x2": 286.4,
"r_y2": 539.6,
"r_x3": 67.8,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 558.6,
"r_x1": 136.3,
"r_y1": 558.6,
"r_x2": 136.3,
"r_y2": 550.6,
"r_x3": 70.0,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.6,
"r_x3": 138.8,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.3,
"r_x1": 286.4,
"r_y1": 569.3,
"r_x2": 286.4,
"r_y2": 561.6,
"r_x3": 70.0,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 74.5,
"r_y1": 580.3,
"r_x2": 74.5,
"r_y2": 572.6,
"r_x3": 70.0,
"r_y3": 572.6,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.5,
"r_y0": 580.5,
"r_x1": 286.4,
"r_y1": 580.5,
"r_x2": 286.4,
"r_y2": 572.5,
"r_x3": 74.5,
"r_y3": 572.5,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.4,
"r_x1": 90.4,
"r_y1": 591.4,
"r_x2": 90.4,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.7,
"r": 286.4,
"b": 646.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.7,
"r_x1": 66.3,
"r_y1": 602.7,
"r_x2": 66.3,
"r_y2": 594.7,
"r_x3": 50.1,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.7,
"r_x1": 286.4,
"r_y1": 602.7,
"r_x2": 286.4,
"r_y2": 594.7,
"r_x3": 68.7,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.7,
"r_x1": 286.4,
"r_y1": 613.7,
"r_x2": 286.4,
"r_y2": 605.7,
"r_x3": 70.0,
"r_y3": 605.7,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.6,
"r_x1": 286.4,
"r_y1": 624.6,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.9,
"r_y0": 635.4,
"r_x1": 286.4,
"r_y1": 635.4,
"r_x2": 286.4,
"r_y2": 627.7,
"r_x3": 79.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 646.4,
"r_x1": 140.7,
"r_y1": 646.4,
"r_x2": 140.7,
"r_y2": 638.6,
"r_x3": 70.0,
"r_y3": 638.6,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.7,
"r_y0": 646.6,
"r_x1": 264.4,
"r_y1": 646.6,
"r_x2": 264.4,
"r_y2": 638.5,
"r_x3": 140.7,
"r_y3": 638.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 649.8,
"r": 286.4,
"b": 679.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 657.8,
"r_x1": 66.5,
"r_y1": 657.8,
"r_x2": 66.5,
"r_y2": 649.8,
"r_x3": 50.1,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 69.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.8,
"r_x1": 93.2,
"r_y1": 668.8,
"r_x2": 93.2,
"r_y2": 660.8,
"r_x3": 70.0,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.8,
"r_x1": 286.4,
"r_y1": 668.8,
"r_x2": 286.4,
"r_y2": 660.8,
"r_x3": 102.2,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 172.0,
"r_y1": 679.7,
"r_x2": 172.0,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 683.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 691.0,
"r_x1": 65.5,
"r_y1": 691.0,
"r_x2": 65.5,
"r_y2": 683.0,
"r_x3": 50.1,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 691.0,
"r_x1": 286.4,
"r_y1": 691.0,
"r_x2": 286.4,
"r_y2": 683.0,
"r_x3": 67.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 702.0,
"r_x1": 102.2,
"r_y1": 702.0,
"r_x2": 102.2,
"r_y2": 694.0,
"r_x3": 70.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.5,
"r_y0": 701.8,
"r_x1": 231.5,
"r_y1": 701.8,
"r_x2": 231.5,
"r_y2": 694.0,
"r_x3": 107.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.5,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 231.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 97.9,
"r_y1": 712.9,
"r_x2": 97.9,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 75.9,
"r": 545.1,
"b": 138.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 83.9,
"r_x1": 324.7,
"r_y1": 83.9,
"r_x2": 324.7,
"r_y2": 75.9,
"r_x3": 308.9,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 327.1,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 545.1,
"r_y1": 94.9,
"r_x2": 545.1,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.8,
"r_x1": 391.0,
"r_y1": 105.8,
"r_x2": 391.0,
"r_y2": 97.8,
"r_x3": 328.8,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.3,
"r_y0": 105.8,
"r_x1": 435.1,
"r_y1": 105.8,
"r_x2": 435.1,
"r_y2": 97.8,
"r_x3": 400.3,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.7,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 441.7,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 440.8,
"r_y1": 116.8,
"r_x2": 440.8,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.6,
"r_y0": 116.6,
"r_x1": 545.1,
"r_y1": 116.6,
"r_x2": 545.1,
"r_y2": 108.8,
"r_x3": 446.6,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 127.5,
"r_x1": 471.1,
"r_y1": 127.5,
"r_x2": 471.1,
"r_y2": 119.8,
"r_x3": 328.8,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.1,
"r_y0": 127.7,
"r_x1": 545.1,
"r_y1": 127.7,
"r_x2": 545.1,
"r_y2": 119.7,
"r_x3": 471.1,
"r_y3": 119.7,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 138.7,
"r_x1": 356.7,
"r_y1": 138.7,
"r_x2": 356.7,
"r_y2": 130.7,
"r_x3": 328.8,
"r_y3": 130.7,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 142.1,
"r": 545.1,
"b": 172.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 150.1,
"r_x1": 325.2,
"r_y1": 150.1,
"r_x2": 325.2,
"r_y2": 142.1,
"r_x3": 308.9,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.1,
"r_x1": 545.1,
"r_y1": 150.1,
"r_x2": 545.1,
"r_y2": 142.1,
"r_x3": 327.7,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.1,
"r_x1": 414.4,
"r_y1": 161.1,
"r_x2": 414.4,
"r_y2": 153.1,
"r_x3": 328.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.8,
"r_y0": 161.1,
"r_x1": 545.1,
"r_y1": 161.1,
"r_x2": 545.1,
"r_y2": 153.1,
"r_x3": 421.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 172.1,
"r_x1": 493.6,
"r_y1": 172.1,
"r_x2": 493.6,
"r_y2": 164.0,
"r_x3": 328.8,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 175.5,
"r": 545.1,
"b": 260.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 324.3,
"r_y1": 183.5,
"r_x2": 324.3,
"r_y2": 175.5,
"r_x3": 308.9,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 175.5,
"r_x3": 326.6,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 194.5,
"r_x1": 545.1,
"r_y1": 194.5,
"r_x2": 545.1,
"r_y2": 186.4,
"r_x3": 328.8,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 205.4,
"r_x1": 545.1,
"r_y1": 205.4,
"r_x2": 545.1,
"r_y2": 197.4,
"r_x3": 328.8,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 216.4,
"r_x1": 545.1,
"r_y1": 216.4,
"r_x2": 545.1,
"r_y2": 208.4,
"r_x3": 328.8,
"r_y3": 208.4,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 227.3,
"r_x1": 479.3,
"r_y1": 227.3,
"r_x2": 479.3,
"r_y2": 219.3,
"r_x3": 328.8,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 227.1,
"r_x1": 545.1,
"r_y1": 227.1,
"r_x2": 545.1,
"r_y2": 219.4,
"r_x3": 483.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 238.1,
"r_x1": 519.4,
"r_y1": 238.1,
"r_x2": 519.4,
"r_y2": 230.4,
"r_x3": 328.8,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.1,
"r_y1": 238.3,
"r_x2": 545.1,
"r_y2": 230.3,
"r_x3": 519.4,
"r_y3": 230.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 249.3,
"r_x1": 545.1,
"r_y1": 249.3,
"r_x2": 545.1,
"r_y2": 241.2,
"r_x3": 328.8,
"r_y3": 241.2,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 260.2,
"r_x1": 333.3,
"r_y1": 260.2,
"r_x2": 333.3,
"r_y2": 252.2,
"r_x3": 328.8,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 263.6,
"r": 545.1,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 271.7,
"r_x1": 324.3,
"r_y1": 271.7,
"r_x2": 324.3,
"r_y2": 263.6,
"r_x3": 308.9,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 271.7,
"r_x1": 545.1,
"r_y1": 271.7,
"r_x2": 545.1,
"r_y2": 263.6,
"r_x3": 326.6,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 274.6,
"r_x3": 328.8,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 293.6,
"r_x1": 545.1,
"r_y1": 293.6,
"r_x2": 545.1,
"r_y2": 285.6,
"r_x3": 328.8,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 296.5,
"r_x3": 328.8,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 315.5,
"r_x1": 352.8,
"r_y1": 315.5,
"r_x2": 352.8,
"r_y2": 307.5,
"r_x3": 328.8,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 315.3,
"r_x1": 545.1,
"r_y1": 315.3,
"r_x2": 545.1,
"r_y2": 307.6,
"r_x3": 360.2,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 326.2,
"r_x1": 371.0,
"r_y1": 326.2,
"r_x2": 371.0,
"r_y2": 318.5,
"r_x3": 328.8,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.0,
"r_y0": 326.5,
"r_x1": 502.3,
"r_y1": 326.5,
"r_x2": 502.3,
"r_y2": 318.4,
"r_x3": 371.0,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 329.9,
"r": 545.1,
"b": 370.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.9,
"r_x1": 323.8,
"r_y1": 337.9,
"r_x2": 323.8,
"r_y2": 329.9,
"r_x3": 308.9,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 337.9,
"r_x1": 545.1,
"r_y1": 337.9,
"r_x2": 545.1,
"r_y2": 329.9,
"r_x3": 326.1,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 348.9,
"r_x1": 545.1,
"r_y1": 348.9,
"r_x2": 545.1,
"r_y2": 340.8,
"r_x3": 328.8,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 359.8,
"r_x1": 382.8,
"r_y1": 359.8,
"r_x2": 382.8,
"r_y2": 351.8,
"r_x3": 328.8,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.5,
"r_y0": 359.6,
"r_x1": 545.1,
"r_y1": 359.6,
"r_x2": 545.1,
"r_y2": 351.9,
"r_x3": 385.5,
"r_y3": 351.9,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 370.6,
"r_x1": 443.6,
"r_y1": 370.6,
"r_x2": 443.6,
"r_y2": 362.8,
"r_x3": 328.8,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.6,
"r_y0": 370.8,
"r_x1": 534.5,
"r_y1": 370.8,
"r_x2": 534.5,
"r_y2": 362.8,
"r_x3": 443.6,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 374.2,
"r": 545.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 382.2,
"r_x1": 324.6,
"r_y1": 382.2,
"r_x2": 324.6,
"r_y2": 374.2,
"r_x3": 308.9,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.0,
"r_y0": 382.2,
"r_x1": 362.7,
"r_y1": 382.2,
"r_x2": 362.7,
"r_y2": 374.2,
"r_x3": 327.0,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.7,
"r_y0": 382.2,
"r_x1": 389.6,
"r_y1": 382.2,
"r_x2": 389.6,
"r_y2": 374.2,
"r_x3": 368.7,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.6,
"r_y0": 382.2,
"r_x1": 424.6,
"r_y1": 382.2,
"r_x2": 424.6,
"r_y2": 374.2,
"r_x3": 395.6,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.5,
"r_y0": 382.2,
"r_x1": 438.0,
"r_y1": 382.2,
"r_x2": 438.0,
"r_y2": 374.2,
"r_x3": 431.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.1,
"r_y0": 382.2,
"r_x1": 488.5,
"r_y1": 382.2,
"r_x2": 488.5,
"r_y2": 374.2,
"r_x3": 444.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.5,
"r_y0": 382.2,
"r_x1": 515.4,
"r_y1": 382.2,
"r_x2": 515.4,
"r_y2": 374.2,
"r_x3": 495.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.4,
"r_y0": 382.2,
"r_x1": 545.1,
"r_y1": 382.2,
"r_x2": 545.1,
"r_y2": 374.2,
"r_x3": 521.4,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 393.2,
"r_x1": 545.1,
"r_y1": 393.2,
"r_x2": 545.1,
"r_y2": 385.2,
"r_x3": 328.8,
"r_y3": 385.2,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 404.1,
"r_x1": 545.1,
"r_y1": 404.1,
"r_x2": 545.1,
"r_y2": 396.1,
"r_x3": 328.8,
"r_y3": 396.1,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 415.1,
"r_x1": 478.0,
"r_y1": 415.1,
"r_x2": 478.0,
"r_y2": 407.1,
"r_x3": 328.8,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.1,
"r_y0": 415.1,
"r_x1": 491.5,
"r_y1": 415.1,
"r_x2": 491.5,
"r_y2": 407.1,
"r_x3": 484.1,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.7,
"r_y0": 414.9,
"r_x1": 545.1,
"r_y1": 414.9,
"r_x2": 545.1,
"r_y2": 407.2,
"r_x3": 494.7,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 425.9,
"r_x1": 545.1,
"r_y1": 425.9,
"r_x2": 545.1,
"r_y2": 418.1,
"r_x3": 328.8,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 436.8,
"r_x1": 360.8,
"r_y1": 436.8,
"r_x2": 360.8,
"r_y2": 429.1,
"r_x3": 328.8,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 437.0,
"r_x1": 475.6,
"r_y1": 437.0,
"r_x2": 475.6,
"r_y2": 429.0,
"r_x3": 360.8,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 440.4,
"r": 545.1,
"b": 558.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.5,
"r_x1": 324.6,
"r_y1": 448.5,
"r_x2": 324.6,
"r_y2": 440.4,
"r_x3": 308.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 448.5,
"r_x1": 545.1,
"r_y1": 448.5,
"r_x2": 545.1,
"r_y2": 440.4,
"r_x3": 326.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 459.4,
"r_x1": 545.1,
"r_y1": 459.4,
"r_x2": 545.1,
"r_y2": 451.4,
"r_x3": 328.8,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 470.4,
"r_x1": 545.1,
"r_y1": 470.4,
"r_x2": 545.1,
"r_y2": 462.4,
"r_x3": 328.8,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 481.3,
"r_x1": 545.1,
"r_y1": 481.3,
"r_x2": 545.1,
"r_y2": 473.3,
"r_x3": 328.8,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 492.3,
"r_x1": 545.1,
"r_y1": 492.3,
"r_x2": 545.1,
"r_y2": 484.3,
"r_x3": 328.8,
"r_y3": 484.3,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 503.3,
"r_x1": 545.1,
"r_y1": 503.3,
"r_x2": 545.1,
"r_y2": 495.2,
"r_x3": 328.8,
"r_y3": 495.2,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 514.2,
"r_x1": 545.1,
"r_y1": 514.2,
"r_x2": 545.1,
"r_y2": 506.2,
"r_x3": 328.8,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 525.2,
"r_x1": 545.1,
"r_y1": 525.2,
"r_x2": 545.1,
"r_y2": 517.2,
"r_x3": 328.8,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 536.1,
"r_x1": 434.6,
"r_y1": 536.1,
"r_x2": 434.6,
"r_y2": 528.1,
"r_x3": 328.8,
"r_y3": 528.1,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.9,
"r_y0": 535.9,
"r_x1": 545.1,
"r_y1": 535.9,
"r_x2": 545.1,
"r_y2": 528.2,
"r_x3": 437.9,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 546.9,
"r_x1": 425.7,
"r_y1": 546.9,
"r_x2": 425.7,
"r_y2": 539.2,
"r_x3": 328.8,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.7,
"r_y0": 547.1,
"r_x1": 545.1,
"r_y1": 547.1,
"r_x2": 545.1,
"r_y2": 539.1,
"r_x3": 425.7,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 558.1,
"r_x1": 399.7,
"r_y1": 558.1,
"r_x2": 399.7,
"r_y2": 550.0,
"r_x3": 328.8,
"r_y3": 550.0,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 561.5,
"r": 545.1,
"b": 624.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.5,
"r_x3": 308.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 569.5,
"r_x1": 545.1,
"r_y1": 569.5,
"r_x2": 545.1,
"r_y2": 561.5,
"r_x3": 326.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 580.5,
"r_x1": 545.1,
"r_y1": 580.5,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 328.8,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 591.4,
"r_x1": 545.1,
"r_y1": 591.4,
"r_x2": 545.1,
"r_y2": 583.4,
"r_x3": 328.8,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 602.4,
"r_x1": 431.6,
"r_y1": 602.4,
"r_x2": 431.6,
"r_y2": 594.4,
"r_x3": 328.8,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 602.2,
"r_x1": 545.1,
"r_y1": 602.2,
"r_x2": 545.1,
"r_y2": 594.4,
"r_x3": 434.7,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 613.1,
"r_x1": 545.1,
"r_y1": 613.1,
"r_x2": 545.1,
"r_y2": 605.4,
"r_x3": 328.8,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 624.1,
"r_x1": 367.8,
"r_y1": 624.1,
"r_x2": 367.8,
"r_y2": 616.4,
"r_x3": 328.8,
"r_y3": 616.4,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.3,
"r_x1": 458.7,
"r_y1": 624.3,
"r_x2": 458.7,
"r_y2": 616.3,
"r_x3": 367.8,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 627.7,
"r": 545.1,
"b": 668.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 635.7,
"r_x1": 324.7,
"r_y1": 635.7,
"r_x2": 324.7,
"r_y2": 627.7,
"r_x3": 308.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 635.7,
"r_x1": 545.1,
"r_y1": 635.7,
"r_x2": 545.1,
"r_y2": 627.7,
"r_x3": 327.1,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 646.7,
"r_x1": 545.1,
"r_y1": 646.7,
"r_x2": 545.1,
"r_y2": 638.7,
"r_x3": 328.8,
"r_y3": 638.7,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 657.7,
"r_x1": 336.3,
"r_y1": 657.7,
"r_x2": 336.3,
"r_y2": 649.6,
"r_x3": 328.8,
"r_y3": 649.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.4,
"r_x1": 545.1,
"r_y1": 657.4,
"r_x2": 545.1,
"r_y2": 649.7,
"r_x3": 338.1,
"r_y3": 649.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 668.4,
"r_x1": 406.3,
"r_y1": 668.4,
"r_x2": 406.3,
"r_y2": 660.7,
"r_x3": 328.8,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 668.6,
"r_x1": 521.1,
"r_y1": 668.6,
"r_x2": 521.1,
"r_y2": 660.6,
"r_x3": 406.3,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 672.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 680.1,
"r_x1": 324.7,
"r_y1": 680.1,
"r_x2": 324.7,
"r_y2": 672.0,
"r_x3": 308.9,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 680.1,
"r_x1": 545.1,
"r_y1": 680.1,
"r_x2": 545.1,
"r_y2": 672.0,
"r_x3": 327.1,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 691.0,
"r_x1": 482.8,
"r_y1": 691.0,
"r_x2": 482.8,
"r_y2": 683.0,
"r_x3": 328.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.8,
"r_y0": 691.0,
"r_x1": 545.1,
"r_y1": 691.0,
"r_x2": 545.1,
"r_y2": 683.0,
"r_x3": 488.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 328.8,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 379.2,
"r_y1": 712.9,
"r_x2": 379.2,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.6,
"r_y0": 712.7,
"r_x1": 545.1,
"r_y1": 712.7,
"r_x2": 545.1,
"r_y2": 705.0,
"r_x3": 381.6,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "list_item",
"id": 25,
"page_no": 8,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.73,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 70.0,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 286.4,
"r_y1": 94.9,
"r_x2": 286.4,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 105.8,
"r_x1": 85.7,
"r_y1": 105.8,
"r_x2": 85.7,
"r_y2": 97.8,
"r_x3": 70.0,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.9,
"r_y0": 105.6,
"r_x1": 199.9,
"r_y1": 105.6,
"r_x2": 199.9,
"r_y2": 97.9,
"r_x3": 87.9,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.9,
"r_y0": 105.8,
"r_x1": 286.4,
"r_y1": 105.8,
"r_x2": 286.4,
"r_y2": 97.8,
"r_x3": 199.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 116.8,
"r_x1": 221.9,
"r_y1": 116.8,
"r_x2": 221.9,
"r_y2": 108.8,
"r_x3": 70.0,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"
},
{
"label": "list_item",
"id": 9,
"page_no": 8,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.0,
"r": 286.4,
"b": 150.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.0,
"r_x1": 65.2,
"r_y1": 128.0,
"r_x2": 65.2,
"r_y2": 120.0,
"r_x3": 54.6,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 128.0,
"r_x1": 286.4,
"r_y1": 128.0,
"r_x2": 286.4,
"r_y2": 120.0,
"r_x3": 67.5,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.0,
"r_x1": 179.7,
"r_y1": 139.0,
"r_x2": 179.7,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 139.0,
"r_x1": 286.4,
"r_y1": 139.0,
"r_x2": 286.4,
"r_y2": 131.0,
"r_x3": 185.6,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 150.0,
"r_x1": 113.1,
"r_y1": 150.0,
"r_x2": 113.1,
"r_y2": 141.9,
"r_x3": 70.0,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.3,
"r_y0": 149.8,
"r_x1": 235.3,
"r_y1": 149.8,
"r_x2": 235.3,
"r_y2": 142.0,
"r_x3": 116.3,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.3,
"r_y0": 150.0,
"r_x1": 267.7,
"r_y1": 150.0,
"r_x2": 267.7,
"r_y2": 141.9,
"r_x3": 235.3,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"
},
{
"label": "list_item",
"id": 7,
"page_no": 8,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.2,
"r": 286.4,
"b": 183.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.2,
"r_x1": 65.1,
"r_y1": 161.2,
"r_x2": 65.1,
"r_y2": 153.2,
"r_x3": 54.6,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 161.2,
"r_x1": 218.8,
"r_y1": 161.2,
"r_x2": 218.8,
"r_y2": 153.2,
"r_x3": 67.4,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.0,
"r_y0": 161.0,
"r_x1": 286.4,
"r_y1": 161.0,
"r_x2": 286.4,
"r_y2": 153.3,
"r_x3": 221.0,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 172.0,
"r_x1": 125.3,
"r_y1": 172.0,
"r_x2": 125.3,
"r_y2": 164.3,
"r_x3": 70.0,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 172.2,
"r_x1": 286.4,
"r_y1": 172.2,
"r_x2": 286.4,
"r_y2": 164.2,
"r_x3": 125.3,
"r_y3": 164.2,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.2,
"r_x1": 97.9,
"r_y1": 183.2,
"r_x2": 97.9,
"r_y2": 175.1,
"r_x3": 70.0,
"r_y3": 175.1,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"
},
{
"label": "list_item",
"id": 0,
"page_no": 8,
"cluster": {
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 186.4,
"r": 286.4,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 194.4,
"r_x1": 65.8,
"r_y1": 194.4,
"r_x2": 65.8,
"r_y2": 186.4,
"r_x3": 54.6,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.2,
"r_y0": 194.4,
"r_x1": 286.4,
"r_y1": 194.4,
"r_x2": 286.4,
"r_y2": 186.4,
"r_x3": 68.2,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.4,
"r_x1": 286.4,
"r_y1": 205.4,
"r_x2": 286.4,
"r_y2": 197.4,
"r_x3": 70.0,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 216.3,
"r_x1": 286.4,
"r_y1": 216.3,
"r_x2": 286.4,
"r_y2": 208.3,
"r_x3": 70.0,
"r_y3": 208.3,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.3,
"r_x1": 245.8,
"r_y1": 227.3,
"r_x2": 245.8,
"r_y2": 219.3,
"r_x3": 70.0,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"
},
{
"label": "list_item",
"id": 1,
"page_no": 8,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 230.6,
"r": 286.4,
"b": 271.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 238.6,
"r_x1": 65.4,
"r_y1": 238.6,
"r_x2": 65.4,
"r_y2": 230.6,
"r_x3": 54.6,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 238.6,
"r_x1": 286.4,
"r_y1": 238.6,
"r_x2": 286.4,
"r_y2": 230.6,
"r_x3": 67.7,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.5,
"r_x1": 286.4,
"r_y1": 249.5,
"r_x2": 286.4,
"r_y2": 241.5,
"r_x3": 70.0,
"r_y3": 241.5,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.5,
"r_x1": 108.4,
"r_y1": 260.5,
"r_x2": 108.4,
"r_y2": 252.5,
"r_x3": 70.0,
"r_y3": 252.5,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.6,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.6,
"r_x3": 110.6,
"r_y3": 252.6,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.2,
"r_x1": 140.6,
"r_y1": 271.2,
"r_x2": 140.6,
"r_y2": 263.5,
"r_x3": 70.0,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.6,
"r_y0": 271.5,
"r_x1": 266.5,
"r_y1": 271.5,
"r_x2": 266.5,
"r_y2": 263.4,
"r_x3": 140.6,
"r_y3": 263.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"
},
{
"label": "list_item",
"id": 2,
"page_no": 8,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 274.7,
"r": 286.4,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 282.7,
"r_x1": 64.8,
"r_y1": 282.7,
"r_x2": 64.8,
"r_y2": 274.7,
"r_x3": 54.6,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.0,
"r_y0": 282.7,
"r_x1": 286.4,
"r_y1": 282.7,
"r_x2": 286.4,
"r_y2": 274.7,
"r_x3": 67.0,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.7,
"r_x1": 179.6,
"r_y1": 293.7,
"r_x2": 179.6,
"r_y2": 285.7,
"r_x3": 70.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 293.7,
"r_x1": 194.5,
"r_y1": 293.7,
"r_x2": 194.5,
"r_y2": 285.7,
"r_x3": 187.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.0,
"r_y0": 293.5,
"r_x1": 286.4,
"r_y1": 293.5,
"r_x2": 286.4,
"r_y2": 285.7,
"r_x3": 198.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.4,
"r_x1": 260.2,
"r_y1": 304.4,
"r_x2": 260.2,
"r_y2": 296.7,
"r_x3": 70.0,
"r_y3": 296.7,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.6,
"r_x1": 286.4,
"r_y1": 304.6,
"r_x2": 286.4,
"r_y2": 296.6,
"r_x3": 260.2,
"r_y3": 296.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.6,
"r_x1": 142.7,
"r_y1": 315.6,
"r_x2": 142.7,
"r_y2": 307.6,
"r_x3": 70.0,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"
},
{
"label": "list_item",
"id": 4,
"page_no": 8,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 318.9,
"r": 286.4,
"b": 348.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 326.9,
"r_x1": 65.6,
"r_y1": 326.9,
"r_x2": 65.6,
"r_y2": 318.9,
"r_x3": 54.6,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 326.9,
"r_x1": 199.5,
"r_y1": 326.9,
"r_x2": 199.5,
"r_y2": 318.9,
"r_x3": 68.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.0,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.9,
"r_x3": 207.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 337.8,
"r_x1": 176.3,
"r_y1": 337.8,
"r_x2": 176.3,
"r_y2": 329.8,
"r_x3": 70.0,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.8,
"r_x1": 190.1,
"r_y1": 337.8,
"r_x2": 190.1,
"r_y2": 329.8,
"r_x3": 182.6,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.3,
"r_y0": 337.6,
"r_x1": 286.4,
"r_y1": 337.6,
"r_x2": 286.4,
"r_y2": 329.9,
"r_x3": 193.3,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.6,
"r_x1": 206.3,
"r_y1": 348.6,
"r_x2": 206.3,
"r_y2": 340.9,
"r_x3": 70.0,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 348.8,
"r_x1": 274.8,
"r_y1": 348.8,
"r_x2": 274.8,
"r_y2": 340.8,
"r_x3": 206.3,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"
},
{
"label": "list_item",
"id": 3,
"page_no": 8,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 352.0,
"r": 286.4,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 360.1,
"r_x1": 65.0,
"r_y1": 360.1,
"r_x2": 65.0,
"r_y2": 352.0,
"r_x3": 54.6,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.3,
"r_y0": 360.1,
"r_x1": 286.4,
"r_y1": 360.1,
"r_x2": 286.4,
"r_y2": 352.0,
"r_x3": 67.3,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 371.0,
"r_x1": 234.1,
"r_y1": 371.0,
"r_x2": 234.1,
"r_y2": 363.0,
"r_x3": 70.0,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.1,
"r_y0": 371.0,
"r_x1": 286.4,
"r_y1": 371.0,
"r_x2": 286.4,
"r_y2": 363.0,
"r_x3": 240.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 382.0,
"r_x1": 286.4,
"r_y1": 382.0,
"r_x2": 286.4,
"r_y2": 374.0,
"r_x3": 70.0,
"r_y3": 374.0,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 70.0,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 114.6,
"r_y1": 403.9,
"r_x2": 114.6,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.7,
"r_x1": 186.7,
"r_y1": 403.7,
"r_x2": 186.7,
"r_y2": 396.0,
"r_x3": 117.8,
"r_y3": 396.0,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.7,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.9,
"r_x3": 186.7,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"
},
{
"label": "list_item",
"id": 10,
"page_no": 8,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.2,
"r": 286.4,
"b": 437.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.2,
"r_x1": 65.3,
"r_y1": 415.2,
"r_x2": 65.3,
"r_y2": 407.2,
"r_x3": 54.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.6,
"r_y0": 415.2,
"r_x1": 286.4,
"r_y1": 415.2,
"r_x2": 286.4,
"r_y2": 407.2,
"r_x3": 67.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 426.1,
"r_x1": 147.1,
"r_y1": 426.1,
"r_x2": 147.1,
"r_y2": 418.1,
"r_x3": 70.0,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.2,
"r_y0": 425.9,
"r_x1": 286.4,
"r_y1": 425.9,
"r_x2": 286.4,
"r_y2": 418.2,
"r_x3": 149.2,
"r_y3": 418.2,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.9,
"r_x1": 213.5,
"r_y1": 436.9,
"r_x2": 213.5,
"r_y2": 429.2,
"r_x3": 70.0,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.5,
"r_y0": 437.1,
"r_x1": 261.0,
"r_y1": 437.1,
"r_x2": 261.0,
"r_y2": 429.1,
"r_x3": 213.5,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"
},
{
"label": "list_item",
"id": 14,
"page_no": 8,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 440.3,
"r": 286.4,
"b": 481.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.4,
"r_x1": 65.4,
"r_y1": 448.4,
"r_x2": 65.4,
"r_y2": 440.3,
"r_x3": 50.1,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 448.4,
"r_x1": 286.4,
"r_y1": 448.4,
"r_x2": 286.4,
"r_y2": 440.3,
"r_x3": 67.7,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 459.3,
"r_x1": 202.7,
"r_y1": 459.3,
"r_x2": 202.7,
"r_y2": 451.3,
"r_x3": 70.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.3,
"r_x1": 286.4,
"r_y1": 459.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 470.3,
"r_x1": 286.4,
"r_y1": 470.3,
"r_x2": 286.4,
"r_y2": 462.3,
"r_x3": 70.0,
"r_y3": 462.3,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.2,
"r_x1": 141.9,
"r_y1": 481.2,
"r_x2": 141.9,
"r_y2": 473.2,
"r_x3": 70.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.0,
"r_x1": 166.0,
"r_y1": 481.0,
"r_x2": 166.0,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.0,
"r_y0": 481.2,
"r_x1": 259.9,
"r_y1": 481.2,
"r_x2": 259.9,
"r_y2": 473.2,
"r_x3": 166.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"
},
{
"label": "list_item",
"id": 11,
"page_no": 8,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 484.5,
"r": 286.4,
"b": 536.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.5,
"r_x1": 66.0,
"r_y1": 492.5,
"r_x2": 66.0,
"r_y2": 484.5,
"r_x3": 50.1,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 492.5,
"r_x1": 286.4,
"r_y1": 492.5,
"r_x2": 286.4,
"r_y2": 484.5,
"r_x3": 68.4,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 503.5,
"r_x1": 286.4,
"r_y1": 503.5,
"r_x2": 286.4,
"r_y2": 495.4,
"r_x3": 70.0,
"r_y3": 495.4,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 514.2,
"r_x1": 227.4,
"r_y1": 514.2,
"r_x2": 227.4,
"r_y2": 506.5,
"r_x3": 70.0,
"r_y3": 506.5,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.4,
"r_y0": 514.4,
"r_x1": 286.4,
"r_y1": 514.4,
"r_x2": 286.4,
"r_y2": 506.4,
"r_x3": 227.4,
"r_y3": 506.4,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.4,
"r_x1": 286.4,
"r_y1": 525.4,
"r_x2": 286.4,
"r_y2": 517.4,
"r_x3": 70.0,
"r_y3": 517.4,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 536.3,
"r_x1": 112.4,
"r_y1": 536.3,
"r_x2": 112.4,
"r_y2": 528.3,
"r_x3": 70.0,
"r_y3": 528.3,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 8,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 539.6,
"r": 286.4,
"b": 591.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 547.6,
"r_x1": 65.5,
"r_y1": 547.6,
"r_x2": 65.5,
"r_y2": 539.6,
"r_x3": 50.1,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 547.6,
"r_x1": 286.4,
"r_y1": 547.6,
"r_x2": 286.4,
"r_y2": 539.6,
"r_x3": 67.8,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 558.6,
"r_x1": 136.3,
"r_y1": 558.6,
"r_x2": 136.3,
"r_y2": 550.6,
"r_x3": 70.0,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.6,
"r_x3": 138.8,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.3,
"r_x1": 286.4,
"r_y1": 569.3,
"r_x2": 286.4,
"r_y2": 561.6,
"r_x3": 70.0,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 74.5,
"r_y1": 580.3,
"r_x2": 74.5,
"r_y2": 572.6,
"r_x3": 70.0,
"r_y3": 572.6,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.5,
"r_y0": 580.5,
"r_x1": 286.4,
"r_y1": 580.5,
"r_x2": 286.4,
"r_y2": 572.5,
"r_x3": 74.5,
"r_y3": 572.5,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.4,
"r_x1": 90.4,
"r_y1": 591.4,
"r_x2": 90.4,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"
},
{
"label": "list_item",
"id": 13,
"page_no": 8,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.7,
"r": 286.4,
"b": 646.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.7,
"r_x1": 66.3,
"r_y1": 602.7,
"r_x2": 66.3,
"r_y2": 594.7,
"r_x3": 50.1,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.7,
"r_x1": 286.4,
"r_y1": 602.7,
"r_x2": 286.4,
"r_y2": 594.7,
"r_x3": 68.7,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.7,
"r_x1": 286.4,
"r_y1": 613.7,
"r_x2": 286.4,
"r_y2": 605.7,
"r_x3": 70.0,
"r_y3": 605.7,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.6,
"r_x1": 286.4,
"r_y1": 624.6,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.9,
"r_y0": 635.4,
"r_x1": 286.4,
"r_y1": 635.4,
"r_x2": 286.4,
"r_y2": 627.7,
"r_x3": 79.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 646.4,
"r_x1": 140.7,
"r_y1": 646.4,
"r_x2": 140.7,
"r_y2": 638.6,
"r_x3": 70.0,
"r_y3": 638.6,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.7,
"r_y0": 646.6,
"r_x1": 264.4,
"r_y1": 646.6,
"r_x2": 264.4,
"r_y2": 638.5,
"r_x3": 140.7,
"r_y3": 638.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"
},
{
"label": "list_item",
"id": 17,
"page_no": 8,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 649.8,
"r": 286.4,
"b": 679.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 657.8,
"r_x1": 66.5,
"r_y1": 657.8,
"r_x2": 66.5,
"r_y2": 649.8,
"r_x3": 50.1,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 69.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.8,
"r_x1": 93.2,
"r_y1": 668.8,
"r_x2": 93.2,
"r_y2": 660.8,
"r_x3": 70.0,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.8,
"r_x1": 286.4,
"r_y1": 668.8,
"r_x2": 286.4,
"r_y2": 660.8,
"r_x3": 102.2,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 172.0,
"r_y1": 679.7,
"r_x2": 172.0,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"
},
{
"label": "list_item",
"id": 16,
"page_no": 8,
"cluster": {
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 683.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 691.0,
"r_x1": 65.5,
"r_y1": 691.0,
"r_x2": 65.5,
"r_y2": 683.0,
"r_x3": 50.1,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 691.0,
"r_x1": 286.4,
"r_y1": 691.0,
"r_x2": 286.4,
"r_y2": 683.0,
"r_x3": 67.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 702.0,
"r_x1": 102.2,
"r_y1": 702.0,
"r_x2": 102.2,
"r_y2": 694.0,
"r_x3": 70.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.5,
"r_y0": 701.8,
"r_x1": 231.5,
"r_y1": 701.8,
"r_x2": 231.5,
"r_y2": 694.0,
"r_x3": 107.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.5,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 231.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 97.9,
"r_y1": 712.9,
"r_x2": 97.9,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"
},
{
"label": "list_item",
"id": 6,
"page_no": 8,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 75.9,
"r": 545.1,
"b": 138.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 83.9,
"r_x1": 324.7,
"r_y1": 83.9,
"r_x2": 324.7,
"r_y2": 75.9,
"r_x3": 308.9,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 327.1,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 545.1,
"r_y1": 94.9,
"r_x2": 545.1,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.8,
"r_x1": 391.0,
"r_y1": 105.8,
"r_x2": 391.0,
"r_y2": 97.8,
"r_x3": 328.8,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.3,
"r_y0": 105.8,
"r_x1": 435.1,
"r_y1": 105.8,
"r_x2": 435.1,
"r_y2": 97.8,
"r_x3": 400.3,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.7,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 441.7,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 440.8,
"r_y1": 116.8,
"r_x2": 440.8,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.6,
"r_y0": 116.6,
"r_x1": 545.1,
"r_y1": 116.6,
"r_x2": 545.1,
"r_y2": 108.8,
"r_x3": 446.6,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 127.5,
"r_x1": 471.1,
"r_y1": 127.5,
"r_x2": 471.1,
"r_y2": 119.8,
"r_x3": 328.8,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.1,
"r_y0": 127.7,
"r_x1": 545.1,
"r_y1": 127.7,
"r_x2": 545.1,
"r_y2": 119.7,
"r_x3": 471.1,
"r_y3": 119.7,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 138.7,
"r_x1": 356.7,
"r_y1": 138.7,
"r_x2": 356.7,
"r_y2": 130.7,
"r_x3": 328.8,
"r_y3": 130.7,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"
},
{
"label": "list_item",
"id": 15,
"page_no": 8,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 142.1,
"r": 545.1,
"b": 172.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 150.1,
"r_x1": 325.2,
"r_y1": 150.1,
"r_x2": 325.2,
"r_y2": 142.1,
"r_x3": 308.9,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.1,
"r_x1": 545.1,
"r_y1": 150.1,
"r_x2": 545.1,
"r_y2": 142.1,
"r_x3": 327.7,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.1,
"r_x1": 414.4,
"r_y1": 161.1,
"r_x2": 414.4,
"r_y2": 153.1,
"r_x3": 328.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.8,
"r_y0": 161.1,
"r_x1": 545.1,
"r_y1": 161.1,
"r_x2": 545.1,
"r_y2": 153.1,
"r_x3": 421.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 172.1,
"r_x1": 493.6,
"r_y1": 172.1,
"r_x2": 493.6,
"r_y2": 164.0,
"r_x3": 328.8,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"
},
{
"label": "list_item",
"id": 12,
"page_no": 8,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 175.5,
"r": 545.1,
"b": 260.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 324.3,
"r_y1": 183.5,
"r_x2": 324.3,
"r_y2": 175.5,
"r_x3": 308.9,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 175.5,
"r_x3": 326.6,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 194.5,
"r_x1": 545.1,
"r_y1": 194.5,
"r_x2": 545.1,
"r_y2": 186.4,
"r_x3": 328.8,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 205.4,
"r_x1": 545.1,
"r_y1": 205.4,
"r_x2": 545.1,
"r_y2": 197.4,
"r_x3": 328.8,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 216.4,
"r_x1": 545.1,
"r_y1": 216.4,
"r_x2": 545.1,
"r_y2": 208.4,
"r_x3": 328.8,
"r_y3": 208.4,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 227.3,
"r_x1": 479.3,
"r_y1": 227.3,
"r_x2": 479.3,
"r_y2": 219.3,
"r_x3": 328.8,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 227.1,
"r_x1": 545.1,
"r_y1": 227.1,
"r_x2": 545.1,
"r_y2": 219.4,
"r_x3": 483.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 238.1,
"r_x1": 519.4,
"r_y1": 238.1,
"r_x2": 519.4,
"r_y2": 230.4,
"r_x3": 328.8,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.1,
"r_y1": 238.3,
"r_x2": 545.1,
"r_y2": 230.3,
"r_x3": 519.4,
"r_y3": 230.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 249.3,
"r_x1": 545.1,
"r_y1": 249.3,
"r_x2": 545.1,
"r_y2": 241.2,
"r_x3": 328.8,
"r_y3": 241.2,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 260.2,
"r_x1": 333.3,
"r_y1": 260.2,
"r_x2": 333.3,
"r_y2": 252.2,
"r_x3": 328.8,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 8,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 263.6,
"r": 545.1,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 271.7,
"r_x1": 324.3,
"r_y1": 271.7,
"r_x2": 324.3,
"r_y2": 263.6,
"r_x3": 308.9,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 271.7,
"r_x1": 545.1,
"r_y1": 271.7,
"r_x2": 545.1,
"r_y2": 263.6,
"r_x3": 326.6,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 274.6,
"r_x3": 328.8,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 293.6,
"r_x1": 545.1,
"r_y1": 293.6,
"r_x2": 545.1,
"r_y2": 285.6,
"r_x3": 328.8,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 296.5,
"r_x3": 328.8,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 315.5,
"r_x1": 352.8,
"r_y1": 315.5,
"r_x2": 352.8,
"r_y2": 307.5,
"r_x3": 328.8,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 315.3,
"r_x1": 545.1,
"r_y1": 315.3,
"r_x2": 545.1,
"r_y2": 307.6,
"r_x3": 360.2,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 326.2,
"r_x1": 371.0,
"r_y1": 326.2,
"r_x2": 371.0,
"r_y2": 318.5,
"r_x3": 328.8,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.0,
"r_y0": 326.5,
"r_x1": 502.3,
"r_y1": 326.5,
"r_x2": 502.3,
"r_y2": 318.4,
"r_x3": 371.0,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"
},
{
"label": "list_item",
"id": 18,
"page_no": 8,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 329.9,
"r": 545.1,
"b": 370.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.9,
"r_x1": 323.8,
"r_y1": 337.9,
"r_x2": 323.8,
"r_y2": 329.9,
"r_x3": 308.9,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 337.9,
"r_x1": 545.1,
"r_y1": 337.9,
"r_x2": 545.1,
"r_y2": 329.9,
"r_x3": 326.1,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 348.9,
"r_x1": 545.1,
"r_y1": 348.9,
"r_x2": 545.1,
"r_y2": 340.8,
"r_x3": 328.8,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 359.8,
"r_x1": 382.8,
"r_y1": 359.8,
"r_x2": 382.8,
"r_y2": 351.8,
"r_x3": 328.8,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.5,
"r_y0": 359.6,
"r_x1": 545.1,
"r_y1": 359.6,
"r_x2": 545.1,
"r_y2": 351.9,
"r_x3": 385.5,
"r_y3": 351.9,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 370.6,
"r_x1": 443.6,
"r_y1": 370.6,
"r_x2": 443.6,
"r_y2": 362.8,
"r_x3": 328.8,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.6,
"r_y0": 370.8,
"r_x1": 534.5,
"r_y1": 370.8,
"r_x2": 534.5,
"r_y2": 362.8,
"r_x3": 443.6,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"
},
{
"label": "list_item",
"id": 21,
"page_no": 8,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 374.2,
"r": 545.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 382.2,
"r_x1": 324.6,
"r_y1": 382.2,
"r_x2": 324.6,
"r_y2": 374.2,
"r_x3": 308.9,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.0,
"r_y0": 382.2,
"r_x1": 362.7,
"r_y1": 382.2,
"r_x2": 362.7,
"r_y2": 374.2,
"r_x3": 327.0,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.7,
"r_y0": 382.2,
"r_x1": 389.6,
"r_y1": 382.2,
"r_x2": 389.6,
"r_y2": 374.2,
"r_x3": 368.7,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.6,
"r_y0": 382.2,
"r_x1": 424.6,
"r_y1": 382.2,
"r_x2": 424.6,
"r_y2": 374.2,
"r_x3": 395.6,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.5,
"r_y0": 382.2,
"r_x1": 438.0,
"r_y1": 382.2,
"r_x2": 438.0,
"r_y2": 374.2,
"r_x3": 431.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.1,
"r_y0": 382.2,
"r_x1": 488.5,
"r_y1": 382.2,
"r_x2": 488.5,
"r_y2": 374.2,
"r_x3": 444.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.5,
"r_y0": 382.2,
"r_x1": 515.4,
"r_y1": 382.2,
"r_x2": 515.4,
"r_y2": 374.2,
"r_x3": 495.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.4,
"r_y0": 382.2,
"r_x1": 545.1,
"r_y1": 382.2,
"r_x2": 545.1,
"r_y2": 374.2,
"r_x3": 521.4,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 393.2,
"r_x1": 545.1,
"r_y1": 393.2,
"r_x2": 545.1,
"r_y2": 385.2,
"r_x3": 328.8,
"r_y3": 385.2,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 404.1,
"r_x1": 545.1,
"r_y1": 404.1,
"r_x2": 545.1,
"r_y2": 396.1,
"r_x3": 328.8,
"r_y3": 396.1,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 415.1,
"r_x1": 478.0,
"r_y1": 415.1,
"r_x2": 478.0,
"r_y2": 407.1,
"r_x3": 328.8,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.1,
"r_y0": 415.1,
"r_x1": 491.5,
"r_y1": 415.1,
"r_x2": 491.5,
"r_y2": 407.1,
"r_x3": 484.1,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.7,
"r_y0": 414.9,
"r_x1": 545.1,
"r_y1": 414.9,
"r_x2": 545.1,
"r_y2": 407.2,
"r_x3": 494.7,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 425.9,
"r_x1": 545.1,
"r_y1": 425.9,
"r_x2": 545.1,
"r_y2": 418.1,
"r_x3": 328.8,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 436.8,
"r_x1": 360.8,
"r_y1": 436.8,
"r_x2": 360.8,
"r_y2": 429.1,
"r_x3": 328.8,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 437.0,
"r_x1": 475.6,
"r_y1": 437.0,
"r_x2": 475.6,
"r_y2": 429.0,
"r_x3": 360.8,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"
},
{
"label": "list_item",
"id": 20,
"page_no": 8,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 440.4,
"r": 545.1,
"b": 558.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.5,
"r_x1": 324.6,
"r_y1": 448.5,
"r_x2": 324.6,
"r_y2": 440.4,
"r_x3": 308.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 448.5,
"r_x1": 545.1,
"r_y1": 448.5,
"r_x2": 545.1,
"r_y2": 440.4,
"r_x3": 326.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 459.4,
"r_x1": 545.1,
"r_y1": 459.4,
"r_x2": 545.1,
"r_y2": 451.4,
"r_x3": 328.8,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 470.4,
"r_x1": 545.1,
"r_y1": 470.4,
"r_x2": 545.1,
"r_y2": 462.4,
"r_x3": 328.8,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 481.3,
"r_x1": 545.1,
"r_y1": 481.3,
"r_x2": 545.1,
"r_y2": 473.3,
"r_x3": 328.8,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 492.3,
"r_x1": 545.1,
"r_y1": 492.3,
"r_x2": 545.1,
"r_y2": 484.3,
"r_x3": 328.8,
"r_y3": 484.3,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 503.3,
"r_x1": 545.1,
"r_y1": 503.3,
"r_x2": 545.1,
"r_y2": 495.2,
"r_x3": 328.8,
"r_y3": 495.2,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 514.2,
"r_x1": 545.1,
"r_y1": 514.2,
"r_x2": 545.1,
"r_y2": 506.2,
"r_x3": 328.8,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 525.2,
"r_x1": 545.1,
"r_y1": 525.2,
"r_x2": 545.1,
"r_y2": 517.2,
"r_x3": 328.8,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 536.1,
"r_x1": 434.6,
"r_y1": 536.1,
"r_x2": 434.6,
"r_y2": 528.1,
"r_x3": 328.8,
"r_y3": 528.1,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.9,
"r_y0": 535.9,
"r_x1": 545.1,
"r_y1": 535.9,
"r_x2": 545.1,
"r_y2": 528.2,
"r_x3": 437.9,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 546.9,
"r_x1": 425.7,
"r_y1": 546.9,
"r_x2": 425.7,
"r_y2": 539.2,
"r_x3": 328.8,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.7,
"r_y0": 547.1,
"r_x1": 545.1,
"r_y1": 547.1,
"r_x2": 545.1,
"r_y2": 539.1,
"r_x3": 425.7,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 558.1,
"r_x1": 399.7,
"r_y1": 558.1,
"r_x2": 399.7,
"r_y2": 550.0,
"r_x3": 328.8,
"r_y3": 550.0,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"
},
{
"label": "list_item",
"id": 19,
"page_no": 8,
"cluster": {
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 561.5,
"r": 545.1,
"b": 624.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.5,
"r_x3": 308.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 569.5,
"r_x1": 545.1,
"r_y1": 569.5,
"r_x2": 545.1,
"r_y2": 561.5,
"r_x3": 326.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 580.5,
"r_x1": 545.1,
"r_y1": 580.5,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 328.8,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 591.4,
"r_x1": 545.1,
"r_y1": 591.4,
"r_x2": 545.1,
"r_y2": 583.4,
"r_x3": 328.8,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 602.4,
"r_x1": 431.6,
"r_y1": 602.4,
"r_x2": 431.6,
"r_y2": 594.4,
"r_x3": 328.8,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 602.2,
"r_x1": 545.1,
"r_y1": 602.2,
"r_x2": 545.1,
"r_y2": 594.4,
"r_x3": 434.7,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 613.1,
"r_x1": 545.1,
"r_y1": 613.1,
"r_x2": 545.1,
"r_y2": 605.4,
"r_x3": 328.8,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 624.1,
"r_x1": 367.8,
"r_y1": 624.1,
"r_x2": 367.8,
"r_y2": 616.4,
"r_x3": 328.8,
"r_y3": 616.4,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.3,
"r_x1": 458.7,
"r_y1": 624.3,
"r_x2": 458.7,
"r_y2": 616.3,
"r_x3": 367.8,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"
},
{
"label": "list_item",
"id": 23,
"page_no": 8,
"cluster": {
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 627.7,
"r": 545.1,
"b": 668.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 635.7,
"r_x1": 324.7,
"r_y1": 635.7,
"r_x2": 324.7,
"r_y2": 627.7,
"r_x3": 308.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 635.7,
"r_x1": 545.1,
"r_y1": 635.7,
"r_x2": 545.1,
"r_y2": 627.7,
"r_x3": 327.1,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 646.7,
"r_x1": 545.1,
"r_y1": 646.7,
"r_x2": 545.1,
"r_y2": 638.7,
"r_x3": 328.8,
"r_y3": 638.7,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 657.7,
"r_x1": 336.3,
"r_y1": 657.7,
"r_x2": 336.3,
"r_y2": 649.6,
"r_x3": 328.8,
"r_y3": 649.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.4,
"r_x1": 545.1,
"r_y1": 657.4,
"r_x2": 545.1,
"r_y2": 649.7,
"r_x3": 338.1,
"r_y3": 649.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 668.4,
"r_x1": 406.3,
"r_y1": 668.4,
"r_x2": 406.3,
"r_y2": 660.7,
"r_x3": 328.8,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 668.6,
"r_x1": 521.1,
"r_y1": 668.6,
"r_x2": 521.1,
"r_y2": 660.6,
"r_x3": 406.3,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 24,
"page_no": 8,
"cluster": {
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 672.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 680.1,
"r_x1": 324.7,
"r_y1": 680.1,
"r_x2": 324.7,
"r_y2": 672.0,
"r_x3": 308.9,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 680.1,
"r_x1": 545.1,
"r_y1": 680.1,
"r_x2": 545.1,
"r_y2": 672.0,
"r_x3": 327.1,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 691.0,
"r_x1": 482.8,
"r_y1": 691.0,
"r_x2": 482.8,
"r_y2": 683.0,
"r_x3": 328.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.8,
"r_y0": 691.0,
"r_x1": 545.1,
"r_y1": 691.0,
"r_x2": 545.1,
"r_y2": 683.0,
"r_x3": 488.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 328.8,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 379.2,
"r_y1": 712.9,
"r_x2": 379.2,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.6,
"r_y0": 712.7,
"r_x1": 545.1,
"r_y1": 712.7,
"r_x2": 545.1,
"r_y2": 705.0,
"r_x3": 381.6,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"
},
{
"label": "page_footer",
"id": 22,
"page_no": 8,
"cluster": {
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9"
}
],
"body": [
{
"label": "list_item",
"id": 25,
"page_no": 8,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.73,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 70.0,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "end object detection with transformers. In Andrea Vedaldi,",
"orig": "end object detection with transformers. In Andrea Vedaldi,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 286.4,
"r_y1": 94.9,
"r_x2": 286.4,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 105.8,
"r_x1": 85.7,
"r_y1": 105.8,
"r_x2": 85.7,
"r_y2": 97.8,
"r_x3": 70.0,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "tors,",
"orig": "tors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 87.9,
"r_y0": 105.6,
"r_x1": 199.9,
"r_y1": 105.6,
"r_x2": 199.9,
"r_y2": 97.9,
"r_x3": 87.9,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision - ECCV 2020",
"orig": "Computer Vision - ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 199.9,
"r_y0": 105.8,
"r_x1": 286.4,
"r_y1": 105.8,
"r_x2": 286.4,
"r_y2": 97.8,
"r_x3": 199.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 213-229, Cham,",
"orig": ", pages 213-229, Cham,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 116.8,
"r_x1": 221.9,
"r_y1": 116.8,
"r_x2": 221.9,
"r_y2": 108.8,
"r_x3": 70.0,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "2020. Springer International Publishing. 5",
"orig": "2020. Springer International Publishing. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"
},
{
"label": "list_item",
"id": 9,
"page_no": 8,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 120.0,
"r": 286.4,
"b": 150.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 128.0,
"r_x1": 65.2,
"r_y1": 128.0,
"r_x2": 65.2,
"r_y2": 120.0,
"r_x3": 54.6,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "[2]",
"orig": "[2]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 128.0,
"r_x1": 286.4,
"r_y1": 128.0,
"r_x2": 286.4,
"r_y2": 120.0,
"r_x3": 67.5,
"r_y3": 120.0,
"coord_origin": "TOPLEFT"
},
"text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.0,
"r_x1": 179.7,
"r_y1": 139.0,
"r_x2": 179.7,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "uan Yin, and Xian-Ling Mao.",
"orig": "uan Yin, and Xian-Ling Mao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 139.0,
"r_x1": 286.4,
"r_y1": 139.0,
"r_x2": 286.4,
"r_y2": 131.0,
"r_x3": 185.6,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "Complicated table structure",
"orig": "Complicated table structure",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 150.0,
"r_x1": 113.1,
"r_y1": 150.0,
"r_x2": 113.1,
"r_y2": 141.9,
"r_x3": 70.0,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": "recognition.",
"orig": "recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.3,
"r_y0": 149.8,
"r_x1": 235.3,
"r_y1": 149.8,
"r_x2": 235.3,
"r_y2": 142.0,
"r_x3": 116.3,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint arXiv:1908.04729",
"orig": "arXiv preprint arXiv:1908.04729",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 235.3,
"r_y0": 150.0,
"r_x1": 267.7,
"r_y1": 150.0,
"r_x2": 267.7,
"r_y2": 141.9,
"r_x3": 235.3,
"r_y3": 141.9,
"coord_origin": "TOPLEFT"
},
"text": ", 2019. 3",
"orig": ", 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"
},
{
"label": "list_item",
"id": 7,
"page_no": 8,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 153.2,
"r": 286.4,
"b": 183.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 161.2,
"r_x1": 65.1,
"r_y1": 161.2,
"r_x2": 65.1,
"r_y2": 153.2,
"r_x3": 54.6,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "[3]",
"orig": "[3]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 161.2,
"r_x1": 218.8,
"r_y1": 161.2,
"r_x2": 218.8,
"r_y2": 153.2,
"r_x3": 67.4,
"r_y3": 153.2,
"coord_origin": "TOPLEFT"
},
"text": "Bertrand Couasnon and Aurelie Lemaitre.",
"orig": "Bertrand Couasnon and Aurelie Lemaitre.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 221.0,
"r_y0": 161.0,
"r_x1": 286.4,
"r_y1": 161.0,
"r_x2": 286.4,
"r_y2": 153.3,
"r_x3": 221.0,
"r_y3": 153.3,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of Ta-",
"orig": "Recognition of Ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 172.0,
"r_x1": 125.3,
"r_y1": 172.0,
"r_x2": 125.3,
"r_y2": 164.3,
"r_x3": 70.0,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "bles and Forms",
"orig": "bles and Forms",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 172.2,
"r_x1": 286.4,
"r_y1": 172.2,
"r_x2": 286.4,
"r_y2": 164.2,
"r_x3": 125.3,
"r_y3": 164.2,
"coord_origin": "TOPLEFT"
},
"text": ", pages 647-677. Springer London, London,",
"orig": ", pages 647-677. Springer London, London,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.2,
"r_x1": 97.9,
"r_y1": 183.2,
"r_x2": 97.9,
"r_y2": 175.1,
"r_x3": 70.0,
"r_y3": 175.1,
"coord_origin": "TOPLEFT"
},
"text": "2014. 2",
"orig": "2014. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"
},
{
"label": "list_item",
"id": 0,
"page_no": 8,
"cluster": {
"id": 0,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 186.4,
"r": 286.4,
"b": 227.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 194.4,
"r_x1": 65.8,
"r_y1": 194.4,
"r_x2": 65.8,
"r_y2": 186.4,
"r_x3": 54.6,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "[4]",
"orig": "[4]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.2,
"r_y0": 194.4,
"r_x1": 286.4,
"r_y1": 194.4,
"r_x2": 286.4,
"r_y2": 186.4,
"r_x3": 68.2,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"orig": "Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.4,
"r_x1": 286.4,
"r_y1": 205.4,
"r_x2": 286.4,
"r_y2": 197.4,
"r_x3": 70.0,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. IC-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 216.3,
"r_x1": 286.4,
"r_y1": 216.3,
"r_x2": 286.4,
"r_y2": 208.3,
"r_x3": 70.0,
"r_y3": 208.3,
"coord_origin": "TOPLEFT"
},
"text": "DAR 2019 Competition on Table Detection and Recognition",
"orig": "DAR 2019 Competition on Table Detection and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.3,
"r_x1": 245.8,
"r_y1": 227.3,
"r_x2": 245.8,
"r_y2": 219.3,
"r_x3": 70.0,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[4] Herv\u00b4e D\u00b4ejean, Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"
},
{
"label": "list_item",
"id": 1,
"page_no": 8,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 230.6,
"r": 286.4,
"b": 271.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 238.6,
"r_x1": 65.4,
"r_y1": 238.6,
"r_x2": 65.4,
"r_y2": 230.6,
"r_x3": 54.6,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "[5]",
"orig": "[5]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 238.6,
"r_x1": 286.4,
"r_y1": 238.6,
"r_x2": 286.4,
"r_y2": 230.6,
"r_x3": 67.7,
"r_y3": 230.6,
"coord_origin": "TOPLEFT"
},
"text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.5,
"r_x1": 286.4,
"r_y1": 249.5,
"r_x2": 286.4,
"r_y2": 241.5,
"r_x3": 70.0,
"r_y3": 241.5,
"coord_origin": "TOPLEFT"
},
"text": "Stavros J Perantonis. Automatic table detection in document",
"orig": "Stavros J Perantonis. Automatic table detection in document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.5,
"r_x1": 108.4,
"r_y1": 260.5,
"r_x2": 108.4,
"r_y2": 252.5,
"r_x3": 70.0,
"r_y3": 252.5,
"coord_origin": "TOPLEFT"
},
"text": "images. In",
"orig": "images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.6,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.6,
"r_x3": 110.6,
"r_y3": 252.6,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Pattern Recognition",
"orig": "International Conference on Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.2,
"r_x1": 140.6,
"r_y1": 271.2,
"r_x2": 140.6,
"r_y2": 263.5,
"r_x3": 70.0,
"r_y3": 263.5,
"coord_origin": "TOPLEFT"
},
"text": "and Image Analysis",
"orig": "and Image Analysis",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.6,
"r_y0": 271.5,
"r_x1": 266.5,
"r_y1": 271.5,
"r_x2": 266.5,
"r_y2": 263.4,
"r_x3": 140.6,
"r_y3": 263.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 609-618. Springer, 2005. 2",
"orig": ", pages 609-618. Springer, 2005. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"
},
{
"label": "list_item",
"id": 2,
"page_no": 8,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 274.7,
"r": 286.4,
"b": 315.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 282.7,
"r_x1": 64.8,
"r_y1": 282.7,
"r_x2": 64.8,
"r_y2": 274.7,
"r_x3": 54.6,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "[6]",
"orig": "[6]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.0,
"r_y0": 282.7,
"r_x1": 286.4,
"r_y1": 282.7,
"r_x2": 286.4,
"r_y2": 274.7,
"r_x3": 67.0,
"r_y3": 274.7,
"coord_origin": "TOPLEFT"
},
"text": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"orig": "Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.7,
"r_x1": 179.6,
"r_y1": 293.7,
"r_x2": 179.6,
"r_y2": 285.7,
"r_x3": 70.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2013 table competition.",
"orig": "Icdar 2013 table competition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.0,
"r_y0": 293.7,
"r_x1": 194.5,
"r_y1": 293.7,
"r_x2": 194.5,
"r_y2": 285.7,
"r_x3": 187.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 198.0,
"r_y0": 293.5,
"r_x1": 286.4,
"r_y1": 293.5,
"r_x2": 286.4,
"r_y2": 285.7,
"r_x3": 198.0,
"r_y3": 285.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International",
"orig": "2013 12th International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.4,
"r_x1": 260.2,
"r_y1": 304.4,
"r_x2": 260.2,
"r_y2": 296.7,
"r_x3": 70.0,
"r_y3": 296.7,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition",
"orig": "Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 260.2,
"r_y0": 304.6,
"r_x1": 286.4,
"r_y1": 304.6,
"r_x2": 286.4,
"r_y2": 296.6,
"r_x3": 260.2,
"r_y3": 296.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.6,
"r_x1": 142.7,
"r_y1": 315.6,
"r_x2": 142.7,
"r_y2": 307.6,
"r_x3": 70.0,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "1449-1453, 2013. 2",
"orig": "1449-1453, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[6] Max G\u00a8obel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"
},
{
"label": "list_item",
"id": 4,
"page_no": 8,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 318.9,
"r": 286.4,
"b": 348.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 326.9,
"r_x1": 65.6,
"r_y1": 326.9,
"r_x2": 65.6,
"r_y2": 318.9,
"r_x3": 54.6,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "[7]",
"orig": "[7]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 326.9,
"r_x1": 199.5,
"r_y1": 326.9,
"r_x2": 199.5,
"r_y2": 318.9,
"r_x3": 68.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "EA Green and M Krishnamoorthy.",
"orig": "EA Green and M Krishnamoorthy.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 207.0,
"r_y0": 326.9,
"r_x1": 286.4,
"r_y1": 326.9,
"r_x2": 286.4,
"r_y2": 318.9,
"r_x3": 207.0,
"r_y3": 318.9,
"coord_origin": "TOPLEFT"
},
"text": "Recognition of tables",
"orig": "Recognition of tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 337.8,
"r_x1": 176.3,
"r_y1": 337.8,
"r_x2": 176.3,
"r_y2": 329.8,
"r_x3": 70.0,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "using table grammars. procs.",
"orig": "using table grammars. procs.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 182.6,
"r_y0": 337.8,
"r_x1": 190.1,
"r_y1": 337.8,
"r_x2": 190.1,
"r_y2": 329.8,
"r_x3": 182.6,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 193.3,
"r_y0": 337.6,
"r_x1": 286.4,
"r_y1": 337.6,
"r_x2": 286.4,
"r_y2": 329.9,
"r_x3": 193.3,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Symposium on Document",
"orig": "Symposium on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.6,
"r_x1": 206.3,
"r_y1": 348.6,
"r_x2": 206.3,
"r_y2": 340.9,
"r_x3": 70.0,
"r_y3": 340.9,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (SDAIR\u201995)",
"orig": "Analysis and Recognition (SDAIR\u201995)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.3,
"r_y0": 348.8,
"r_x1": 274.8,
"r_y1": 348.8,
"r_x2": 274.8,
"r_y2": 340.8,
"r_x3": 206.3,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 261-277. 2",
"orig": ", pages 261-277. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"
},
{
"label": "list_item",
"id": 3,
"page_no": 8,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 352.0,
"r": 286.4,
"b": 403.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 360.1,
"r_x1": 65.0,
"r_y1": 360.1,
"r_x2": 65.0,
"r_y2": 352.0,
"r_x3": 54.6,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "[8]",
"orig": "[8]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.3,
"r_y0": 360.1,
"r_x1": 286.4,
"r_y1": 360.1,
"r_x2": 286.4,
"r_y2": 352.0,
"r_x3": 67.3,
"r_y3": 352.0,
"coord_origin": "TOPLEFT"
},
"text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 371.0,
"r_x1": 234.1,
"r_y1": 371.0,
"r_x2": 234.1,
"r_y2": 363.0,
"r_x3": 70.0,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "dier Stricker, and Muhammad Zeshan Afzal.",
"orig": "dier Stricker, and Muhammad Zeshan Afzal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 240.1,
"r_y0": 371.0,
"r_x1": 286.4,
"r_y1": 371.0,
"r_x2": 286.4,
"r_y2": 363.0,
"r_x3": 240.1,
"r_y3": 363.0,
"coord_origin": "TOPLEFT"
},
"text": "Castabdetec-",
"orig": "Castabdetec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 382.0,
"r_x1": 286.4,
"r_y1": 382.0,
"r_x2": 286.4,
"r_y2": 374.0,
"r_x3": 70.0,
"r_y3": 374.0,
"coord_origin": "TOPLEFT"
},
"text": "tors: Cascade network for table detection in document im-",
"orig": "tors: Cascade network for table detection in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 70.0,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "ages with recursive feature pyramid and switchable atrous",
"orig": "ages with recursive feature pyramid and switchable atrous",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 114.6,
"r_y1": 403.9,
"r_x2": 114.6,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "convolution.",
"orig": "convolution.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 117.8,
"r_y0": 403.7,
"r_x1": 186.7,
"r_y1": 403.7,
"r_x2": 186.7,
"r_y2": 396.0,
"r_x3": 117.8,
"r_y3": 396.0,
"coord_origin": "TOPLEFT"
},
"text": "Journal of Imaging",
"orig": "Journal of Imaging",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 186.7,
"r_y0": 403.9,
"r_x1": 243.0,
"r_y1": 403.9,
"r_x2": 243.0,
"r_y2": 395.9,
"r_x3": 186.7,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": ", 7(10), 2021. 1",
"orig": ", 7(10), 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"
},
{
"label": "list_item",
"id": 10,
"page_no": 8,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 54.6,
"t": 407.2,
"r": 286.4,
"b": 437.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 415.2,
"r_x1": 65.3,
"r_y1": 415.2,
"r_x2": 65.3,
"r_y2": 407.2,
"r_x3": 54.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "[9]",
"orig": "[9]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.6,
"r_y0": 415.2,
"r_x1": 286.4,
"r_y1": 415.2,
"r_x2": 286.4,
"r_y2": 407.2,
"r_x3": 67.6,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 426.1,
"r_x1": 147.1,
"r_y1": 426.1,
"r_x2": 147.1,
"r_y2": 418.1,
"r_x3": 70.0,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "shick. Mask r-cnn. In",
"orig": "shick. Mask r-cnn. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.2,
"r_y0": 425.9,
"r_x1": 286.4,
"r_y1": 425.9,
"r_x2": 286.4,
"r_y2": 418.2,
"r_x3": 149.2,
"r_y3": 418.2,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE International",
"orig": "Proceedings of the IEEE International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.9,
"r_x1": 213.5,
"r_y1": 436.9,
"r_x2": 213.5,
"r_y2": 429.2,
"r_x3": 70.0,
"r_y3": 429.2,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision (ICCV)",
"orig": "Conference on Computer Vision (ICCV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 213.5,
"r_y0": 437.1,
"r_x1": 261.0,
"r_y1": 437.1,
"r_x2": 261.0,
"r_y2": 429.1,
"r_x3": 213.5,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": ", Oct 2017. 1",
"orig": ", Oct 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"
},
{
"label": "list_item",
"id": 14,
"page_no": 8,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 440.3,
"r": 286.4,
"b": 481.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.4,
"r_x1": 65.4,
"r_y1": 448.4,
"r_x2": 65.4,
"r_y2": 440.3,
"r_x3": 50.1,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "[10]",
"orig": "[10]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 448.4,
"r_x1": 286.4,
"r_y1": 448.4,
"r_x2": 286.4,
"r_y2": 440.3,
"r_x3": 67.7,
"r_y3": 440.3,
"coord_origin": "TOPLEFT"
},
"text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 459.3,
"r_x1": 202.7,
"r_y1": 459.3,
"r_x2": 202.7,
"r_y2": 451.3,
"r_x3": 70.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "cong Li, Xin Tang, and Rong Xiao.",
"orig": "cong Li, Xin Tang, and Rong Xiao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 209.0,
"r_y0": 459.3,
"r_x1": 286.4,
"r_y1": 459.3,
"r_x2": 286.4,
"r_y2": 451.3,
"r_x3": 209.0,
"r_y3": 451.3,
"coord_origin": "TOPLEFT"
},
"text": "Pingan-vcgroup\u2019s so-",
"orig": "Pingan-vcgroup\u2019s so-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 470.3,
"r_x1": 286.4,
"r_y1": 470.3,
"r_x2": 286.4,
"r_y2": 462.3,
"r_x3": 70.0,
"r_y3": 462.3,
"coord_origin": "TOPLEFT"
},
"text": "lution for icdar 2021 competition on scientific table image",
"orig": "lution for icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.2,
"r_x1": 141.9,
"r_y1": 481.2,
"r_x2": 141.9,
"r_y2": 473.2,
"r_x3": 70.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex.",
"orig": "recognition to latex.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 145.1,
"r_y0": 481.0,
"r_x1": 166.0,
"r_y1": 481.0,
"r_x2": 166.0,
"r_y2": 473.3,
"r_x3": 145.1,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "ArXiv",
"orig": "ArXiv",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 166.0,
"r_y0": 481.2,
"r_x1": 259.9,
"r_y1": 481.2,
"r_x2": 259.9,
"r_y2": 473.2,
"r_x3": 166.0,
"r_y3": 473.2,
"coord_origin": "TOPLEFT"
},
"text": ", abs/2105.01846, 2021. 2",
"orig": ", abs/2105.01846, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"
},
{
"label": "list_item",
"id": 11,
"page_no": 8,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 484.5,
"r": 286.4,
"b": 536.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.5,
"r_x1": 66.0,
"r_y1": 492.5,
"r_x2": 66.0,
"r_y2": 484.5,
"r_x3": 50.1,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "[11]",
"orig": "[11]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 492.5,
"r_x1": 286.4,
"r_y1": 492.5,
"r_x2": 286.4,
"r_y2": 484.5,
"r_x3": 68.4,
"r_y3": 484.5,
"coord_origin": "TOPLEFT"
},
"text": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"orig": "Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 503.5,
"r_x1": 286.4,
"r_y1": 503.5,
"r_x2": 286.4,
"r_y2": 495.4,
"r_x3": 70.0,
"r_y3": 495.4,
"coord_origin": "TOPLEFT"
},
"text": "Gordon Wilfong. Medium-independent table detection. In",
"orig": "Gordon Wilfong. Medium-independent table detection. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 514.2,
"r_x1": 227.4,
"r_y1": 514.2,
"r_x2": 227.4,
"r_y2": 506.5,
"r_x3": 70.0,
"r_y3": 506.5,
"coord_origin": "TOPLEFT"
},
"text": "Document Recognition and Retrieval VII",
"orig": "Document Recognition and Retrieval VII",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.4,
"r_y0": 514.4,
"r_x1": 286.4,
"r_y1": 514.4,
"r_x2": 286.4,
"r_y2": 506.4,
"r_x3": 227.4,
"r_y3": 506.4,
"coord_origin": "TOPLEFT"
},
"text": ", volume 3967,",
"orig": ", volume 3967,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.4,
"r_x1": 286.4,
"r_y1": 525.4,
"r_x2": 286.4,
"r_y2": 517.4,
"r_x3": 70.0,
"r_y3": 517.4,
"coord_origin": "TOPLEFT"
},
"text": "pages 291-302. International Society for Optics and Photon-",
"orig": "pages 291-302. International Society for Optics and Photon-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 536.3,
"r_x1": 112.4,
"r_y1": 536.3,
"r_x2": 112.4,
"r_y2": 528.3,
"r_x3": 70.0,
"r_y3": 528.3,
"coord_origin": "TOPLEFT"
},
"text": "ics, 1999. 2",
"orig": "ics, 1999. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 8,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 539.6,
"r": 286.4,
"b": 591.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 547.6,
"r_x1": 65.5,
"r_y1": 547.6,
"r_x2": 65.5,
"r_y2": 539.6,
"r_x3": 50.1,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "[12]",
"orig": "[12]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 547.6,
"r_x1": 286.4,
"r_y1": 547.6,
"r_x2": 286.4,
"r_y2": 539.6,
"r_x3": 67.8,
"r_y3": 539.6,
"coord_origin": "TOPLEFT"
},
"text": "Matthew Hurst. A constraint-based approach to table struc-",
"orig": "Matthew Hurst. A constraint-based approach to table struc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 558.6,
"r_x1": 136.3,
"r_y1": 558.6,
"r_x2": 136.3,
"r_y2": 550.6,
"r_x3": 70.0,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "ture derivation. In",
"orig": "ture derivation. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.8,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.6,
"r_x3": 138.8,
"r_y3": 550.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the Seventh International",
"orig": "Proceedings of the Seventh International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.3,
"r_x1": 286.4,
"r_y1": 569.3,
"r_x2": 286.4,
"r_y2": 561.6,
"r_x3": 70.0,
"r_y3": 561.6,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Document Analysis and Recognition - Volume",
"orig": "Conference on Document Analysis and Recognition - Volume",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 74.5,
"r_y1": 580.3,
"r_x2": 74.5,
"r_y2": 572.6,
"r_x3": 70.0,
"r_y3": 572.6,
"coord_origin": "TOPLEFT"
},
"text": "2",
"orig": "2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 74.5,
"r_y0": 580.5,
"r_x1": 286.4,
"r_y1": 580.5,
"r_x2": 286.4,
"r_y2": 572.5,
"r_x3": 74.5,
"r_y3": 572.5,
"coord_origin": "TOPLEFT"
},
"text": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"orig": ", ICDAR \u201903, page 911, USA, 2003. IEEE Computer Soci-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.4,
"r_x1": 90.4,
"r_y1": 591.4,
"r_x2": 90.4,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "ety. 2",
"orig": "ety. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"
},
{
"label": "list_item",
"id": 13,
"page_no": 8,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.7,
"r": 286.4,
"b": 646.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.7,
"r_x1": 66.3,
"r_y1": 602.7,
"r_x2": 66.3,
"r_y2": 594.7,
"r_x3": 50.1,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "[13]",
"orig": "[13]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.7,
"r_y0": 602.7,
"r_x1": 286.4,
"r_y1": 602.7,
"r_x2": 286.4,
"r_y2": 594.7,
"r_x3": 68.7,
"r_y3": 594.7,
"coord_origin": "TOPLEFT"
},
"text": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"orig": "Thotreingam Kasar, Philippine Barlas, Sebastien Adam,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.7,
"r_x1": 286.4,
"r_y1": 613.7,
"r_x2": 286.4,
"r_y2": 605.7,
"r_x3": 70.0,
"r_y3": 605.7,
"coord_origin": "TOPLEFT"
},
"text": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"orig": "Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.6,
"r_x1": 286.4,
"r_y1": 624.6,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "tables in scanned document images using line information.",
"orig": "tables in scanned document images using line information.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.6,
"r_x1": 77.5,
"r_y1": 635.6,
"r_x2": 77.5,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.9,
"r_y0": 635.4,
"r_x1": 286.4,
"r_y1": 635.4,
"r_x2": 286.4,
"r_y2": 627.7,
"r_x3": 79.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "2013 12th International Conference on Document Analy-",
"orig": "2013 12th International Conference on Document Analy-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 646.4,
"r_x1": 140.7,
"r_y1": 646.4,
"r_x2": 140.7,
"r_y2": 638.6,
"r_x3": 70.0,
"r_y3": 638.6,
"coord_origin": "TOPLEFT"
},
"text": "sis and Recognition",
"orig": "sis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 140.7,
"r_y0": 646.6,
"r_x1": 264.4,
"r_y1": 646.6,
"r_x2": 264.4,
"r_y2": 638.5,
"r_x3": 140.7,
"r_y3": 638.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1185-1189. IEEE, 2013. 2",
"orig": ", pages 1185-1189. IEEE, 2013. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ement Chatelain, and Thierry Paquet. Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"
},
{
"label": "list_item",
"id": 17,
"page_no": 8,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 649.8,
"r": 286.4,
"b": 679.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 657.8,
"r_x1": 66.5,
"r_y1": 657.8,
"r_x2": 66.5,
"r_y2": 649.8,
"r_x3": 50.1,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "[14]",
"orig": "[14]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 69.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"orig": "Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.8,
"r_x1": 93.2,
"r_y1": 668.8,
"r_x2": 93.2,
"r_y2": 660.8,
"r_x3": 70.0,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Singh.",
"orig": "Singh.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 102.2,
"r_y0": 668.8,
"r_x1": 286.4,
"r_y1": 668.8,
"r_x2": 286.4,
"r_y2": 660.8,
"r_x3": 102.2,
"r_y3": 660.8,
"coord_origin": "TOPLEFT"
},
"text": "Icdar 2021 competition on scientific table image",
"orig": "Icdar 2021 competition on scientific table image",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 172.0,
"r_y1": 679.7,
"r_x2": 172.0,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "recognition to latex, 2021. 2",
"orig": "recognition to latex, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"
},
{
"label": "list_item",
"id": 16,
"page_no": 8,
"cluster": {
"id": 16,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 683.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 691.0,
"r_x1": 65.5,
"r_y1": 691.0,
"r_x2": 65.5,
"r_y2": 683.0,
"r_x3": 50.1,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "[15]",
"orig": "[15]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 691.0,
"r_x1": 286.4,
"r_y1": 691.0,
"r_x2": 286.4,
"r_y2": 683.0,
"r_x3": 67.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Harold W Kuhn. The hungarian method for the assignment",
"orig": "Harold W Kuhn. The hungarian method for the assignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 702.0,
"r_x1": 102.2,
"r_y1": 702.0,
"r_x2": 102.2,
"r_y2": 694.0,
"r_x3": 70.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "problem.",
"orig": "problem.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 107.5,
"r_y0": 701.8,
"r_x1": 231.5,
"r_y1": 701.8,
"r_x2": 231.5,
"r_y2": 694.0,
"r_x3": 107.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Naval research logistics quarterly",
"orig": "Naval research logistics quarterly",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 231.5,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 231.5,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": ", 2(1-2):83-97,",
"orig": ", 2(1-2):83-97,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 97.9,
"r_y1": 712.9,
"r_x2": 97.9,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "1955. 6",
"orig": "1955. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[15] Harold W Kuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"
},
{
"label": "list_item",
"id": 6,
"page_no": 8,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 75.9,
"r": 545.1,
"b": 138.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 83.9,
"r_x1": 324.7,
"r_y1": 83.9,
"r_x2": 324.7,
"r_y2": 75.9,
"r_x3": 308.9,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "[16]",
"orig": "[16]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 327.1,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"orig": "Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sag-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 545.1,
"r_y1": 94.9,
"r_x2": 545.1,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.8,
"r_x1": 391.0,
"r_y1": 105.8,
"r_x2": 391.0,
"r_y2": 97.8,
"r_x3": 328.8,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Tamara L. Berg.",
"orig": "Tamara L. Berg.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.3,
"r_y0": 105.8,
"r_x1": 435.1,
"r_y1": 105.8,
"r_x2": 435.1,
"r_y2": 97.8,
"r_x3": 400.3,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Babytalk:",
"orig": "Babytalk:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 441.7,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 441.7,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": "Understanding and generat-",
"orig": "Understanding and generat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 440.8,
"r_y1": 116.8,
"r_x2": 440.8,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "ing simple image descriptions.",
"orig": "ing simple image descriptions.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 446.6,
"r_y0": 116.6,
"r_x1": 545.1,
"r_y1": 116.6,
"r_x2": 545.1,
"r_y2": 108.8,
"r_x3": 446.6,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "IEEE Transactions on Pat-",
"orig": "IEEE Transactions on Pat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 127.5,
"r_x1": 471.1,
"r_y1": 127.5,
"r_x2": 471.1,
"r_y2": 119.8,
"r_x3": 328.8,
"r_y3": 119.8,
"coord_origin": "TOPLEFT"
},
"text": "tern Analysis and Machine Intelligence",
"orig": "tern Analysis and Machine Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 471.1,
"r_y0": 127.7,
"r_x1": 545.1,
"r_y1": 127.7,
"r_x2": 545.1,
"r_y2": 119.7,
"r_x3": 471.1,
"r_y3": 119.7,
"coord_origin": "TOPLEFT"
},
"text": ", 35(12):2891-2903,",
"orig": ", 35(12):2891-2903,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 138.7,
"r_x1": 356.7,
"r_y1": 138.7,
"r_x2": 356.7,
"r_y2": 130.7,
"r_x3": 328.8,
"r_y3": 130.7,
"coord_origin": "TOPLEFT"
},
"text": "2013. 4",
"orig": "2013. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"
},
{
"label": "list_item",
"id": 15,
"page_no": 8,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 142.1,
"r": 545.1,
"b": 172.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 150.1,
"r_x1": 325.2,
"r_y1": 150.1,
"r_x2": 325.2,
"r_y2": 142.1,
"r_x3": 308.9,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "[17]",
"orig": "[17]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.7,
"r_y0": 150.1,
"r_x1": 545.1,
"r_y1": 150.1,
"r_x2": 545.1,
"r_y2": 142.1,
"r_x3": 327.7,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"orig": "Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.1,
"r_x1": 414.4,
"r_y1": 161.1,
"r_x2": 414.4,
"r_y2": 153.1,
"r_x3": 328.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Zhou, and Zhoujun Li.",
"orig": "Zhou, and Zhoujun Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 421.8,
"r_y0": 161.1,
"r_x1": 545.1,
"r_y1": 161.1,
"r_x2": 545.1,
"r_y2": 153.1,
"r_x3": 421.8,
"r_y3": 153.1,
"coord_origin": "TOPLEFT"
},
"text": "Tablebank: A benchmark dataset",
"orig": "Tablebank: A benchmark dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 172.1,
"r_x1": 493.6,
"r_y1": 172.1,
"r_x2": 493.6,
"r_y2": 164.0,
"r_x3": 328.8,
"r_y3": 164.0,
"coord_origin": "TOPLEFT"
},
"text": "for table detection and recognition, 2019. 2, 3",
"orig": "for table detection and recognition, 2019. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"
},
{
"label": "list_item",
"id": 12,
"page_no": 8,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 175.5,
"r": 545.1,
"b": 260.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 324.3,
"r_y1": 183.5,
"r_x2": 324.3,
"r_y2": 175.5,
"r_x3": 308.9,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "[18]",
"orig": "[18]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 175.5,
"r_x3": 326.6,
"r_y3": 175.5,
"coord_origin": "TOPLEFT"
},
"text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 194.5,
"r_x1": 545.1,
"r_y1": 194.5,
"r_x2": 545.1,
"r_y2": 186.4,
"r_x3": 328.8,
"r_y3": 186.4,
"coord_origin": "TOPLEFT"
},
"text": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"orig": "Xianhui Liu. Gfte: Graph-based financial table extraction.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 205.4,
"r_x1": 545.1,
"r_y1": 205.4,
"r_x2": 545.1,
"r_y2": 197.4,
"r_x3": 328.8,
"r_y3": 197.4,
"coord_origin": "TOPLEFT"
},
"text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 216.4,
"r_x1": 545.1,
"r_y1": 216.4,
"r_x2": 545.1,
"r_y2": 208.4,
"r_x3": 328.8,
"r_y3": 208.4,
"coord_origin": "TOPLEFT"
},
"text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 227.3,
"r_x1": 479.3,
"r_y1": 227.3,
"r_x2": 479.3,
"r_y2": 219.3,
"r_x3": 328.8,
"r_y3": 219.3,
"coord_origin": "TOPLEFT"
},
"text": "Escalante, and Roberto Vezzani, editors,",
"orig": "Escalante, and Roberto Vezzani, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.1,
"r_y0": 227.1,
"r_x1": 545.1,
"r_y1": 227.1,
"r_x2": 545.1,
"r_y2": 219.4,
"r_x3": 483.1,
"r_y3": 219.4,
"coord_origin": "TOPLEFT"
},
"text": "Pattern Recogni-",
"orig": "Pattern Recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 238.1,
"r_x1": 519.4,
"r_y1": 238.1,
"r_x2": 519.4,
"r_y2": 230.4,
"r_x3": 328.8,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "tion. ICPR International Workshops and Challenges",
"orig": "tion. ICPR International Workshops and Challenges",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 519.4,
"r_y0": 238.3,
"r_x1": 545.1,
"r_y1": 238.3,
"r_x2": 545.1,
"r_y2": 230.3,
"r_x3": 519.4,
"r_y3": 230.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages",
"orig": ", pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 249.3,
"r_x1": 545.1,
"r_y1": 249.3,
"r_x2": 545.1,
"r_y2": 241.2,
"r_x3": 328.8,
"r_y3": 241.2,
"coord_origin": "TOPLEFT"
},
"text": "644-658, Cham, 2021. Springer International Publishing. 2,",
"orig": "644-658, Cham, 2021. Springer International Publishing. 2,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 260.2,
"r_x1": 333.3,
"r_y1": 260.2,
"r_x2": 333.3,
"r_y2": 252.2,
"r_x3": 328.8,
"r_y3": 252.2,
"coord_origin": "TOPLEFT"
},
"text": "3",
"orig": "3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 8,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 263.6,
"r": 545.1,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 271.7,
"r_x1": 324.3,
"r_y1": 271.7,
"r_x2": 324.3,
"r_y2": 263.6,
"r_x3": 308.9,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "[19]",
"orig": "[19]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.6,
"r_y0": 271.7,
"r_x1": 545.1,
"r_y1": 271.7,
"r_x2": 545.1,
"r_y2": 263.6,
"r_x3": 326.6,
"r_y3": 263.6,
"coord_origin": "TOPLEFT"
},
"text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 282.6,
"r_x1": 545.1,
"r_y1": 282.6,
"r_x2": 545.1,
"r_y2": 274.6,
"r_x3": 328.8,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 293.6,
"r_x1": 545.1,
"r_y1": 293.6,
"r_x2": 545.1,
"r_y2": 285.6,
"r_x3": 328.8,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Ro-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 304.5,
"r_x1": 545.1,
"r_y1": 304.5,
"r_x2": 545.1,
"r_y2": 296.5,
"r_x3": 328.8,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "bust pdf document conversion using recurrent neural net-",
"orig": "bust pdf document conversion using recurrent neural net-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 315.5,
"r_x1": 352.8,
"r_y1": 315.5,
"r_x2": 352.8,
"r_y2": 307.5,
"r_x3": 328.8,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "works.",
"orig": "works.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.2,
"r_y0": 315.3,
"r_x1": 545.1,
"r_y1": 315.3,
"r_x2": 545.1,
"r_y2": 307.6,
"r_x3": 360.2,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the AAAI Conference on Artificial",
"orig": "Proceedings of the AAAI Conference on Artificial",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 326.2,
"r_x1": 371.0,
"r_y1": 326.2,
"r_x2": 371.0,
"r_y2": 318.5,
"r_x3": 328.8,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Intelligence",
"orig": "Intelligence",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.0,
"r_y0": 326.5,
"r_x1": 502.3,
"r_y1": 326.5,
"r_x2": 502.3,
"r_y2": 318.4,
"r_x3": 371.0,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", 35(17):15137-15145, May 2021. 1",
"orig": ", 35(17):15137-15145, May 2021. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"
},
{
"label": "list_item",
"id": 18,
"page_no": 8,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 329.9,
"r": 545.1,
"b": 370.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 337.9,
"r_x1": 323.8,
"r_y1": 337.9,
"r_x2": 323.8,
"r_y2": 329.9,
"r_x3": 308.9,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "[20]",
"orig": "[20]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.1,
"r_y0": 337.9,
"r_x1": 545.1,
"r_y1": 337.9,
"r_x2": 545.1,
"r_y2": 329.9,
"r_x3": 326.1,
"r_y3": 329.9,
"coord_origin": "TOPLEFT"
},
"text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 348.9,
"r_x1": 545.1,
"r_y1": 348.9,
"r_x2": 545.1,
"r_y2": 340.8,
"r_x3": 328.8,
"r_y3": 340.8,
"coord_origin": "TOPLEFT"
},
"text": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"orig": "Yongpan Wang, and Gui-Song Xia. Parsing table structures",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 359.8,
"r_x1": 382.8,
"r_y1": 359.8,
"r_x2": 382.8,
"r_y2": 351.8,
"r_x3": 328.8,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "in the wild. In",
"orig": "in the wild. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 385.5,
"r_y0": 359.6,
"r_x1": 545.1,
"r_y1": 359.6,
"r_x2": 545.1,
"r_y2": 351.9,
"r_x3": 385.5,
"r_y3": 351.9,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF International",
"orig": "Proceedings of the IEEE/CVF International",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 370.6,
"r_x1": 443.6,
"r_y1": 370.6,
"r_x2": 443.6,
"r_y2": 362.8,
"r_x3": 328.8,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision",
"orig": "Conference on Computer Vision",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 443.6,
"r_y0": 370.8,
"r_x1": 534.5,
"r_y1": 370.8,
"r_x2": 534.5,
"r_y2": 362.8,
"r_x3": 443.6,
"r_y3": 362.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 944-952, 2021. 2",
"orig": ", pages 944-952, 2021. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"
},
{
"label": "list_item",
"id": 21,
"page_no": 8,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 374.2,
"r": 545.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 382.2,
"r_x1": 324.6,
"r_y1": 382.2,
"r_x2": 324.6,
"r_y2": 374.2,
"r_x3": 308.9,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "[21]",
"orig": "[21]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.0,
"r_y0": 382.2,
"r_x1": 362.7,
"r_y1": 382.2,
"r_x2": 362.7,
"r_y2": 374.2,
"r_x3": 327.0,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Shubham",
"orig": "Shubham",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 368.7,
"r_y0": 382.2,
"r_x1": 389.6,
"r_y1": 382.2,
"r_x2": 389.6,
"r_y2": 374.2,
"r_x3": 368.7,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Singh",
"orig": "Singh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 395.6,
"r_y0": 382.2,
"r_x1": 424.6,
"r_y1": 382.2,
"r_x2": 424.6,
"r_y2": 374.2,
"r_x3": 395.6,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Paliwal,",
"orig": "Paliwal,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 431.5,
"r_y0": 382.2,
"r_x1": 438.0,
"r_y1": 382.2,
"r_x2": 438.0,
"r_y2": 374.2,
"r_x3": 431.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "D",
"orig": "D",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 444.1,
"r_y0": 382.2,
"r_x1": 488.5,
"r_y1": 382.2,
"r_x2": 488.5,
"r_y2": 374.2,
"r_x3": 444.1,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Vishwanath,",
"orig": "Vishwanath,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 495.5,
"r_y0": 382.2,
"r_x1": 515.4,
"r_y1": 382.2,
"r_x2": 515.4,
"r_y2": 374.2,
"r_x3": 495.5,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rohit",
"orig": "Rohit",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 521.4,
"r_y0": 382.2,
"r_x1": 545.1,
"r_y1": 382.2,
"r_x2": 545.1,
"r_y2": 374.2,
"r_x3": 521.4,
"r_y3": 374.2,
"coord_origin": "TOPLEFT"
},
"text": "Rahul,",
"orig": "Rahul,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 393.2,
"r_x1": 545.1,
"r_y1": 393.2,
"r_x2": 545.1,
"r_y2": 385.2,
"r_x3": 328.8,
"r_y3": 385.2,
"coord_origin": "TOPLEFT"
},
"text": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"orig": "Monika Sharma, and Lovekesh Vig. Tablenet: Deep learn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 404.1,
"r_x1": 545.1,
"r_y1": 404.1,
"r_x2": 545.1,
"r_y2": 396.1,
"r_x3": 328.8,
"r_y3": 396.1,
"coord_origin": "TOPLEFT"
},
"text": "ing model for end-to-end table detection and tabular data ex-",
"orig": "ing model for end-to-end table detection and tabular data ex-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 415.1,
"r_x1": 478.0,
"r_y1": 415.1,
"r_x2": 478.0,
"r_y2": 407.1,
"r_x3": 328.8,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "traction from scanned document images.",
"orig": "traction from scanned document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 484.1,
"r_y0": 415.1,
"r_x1": 491.5,
"r_y1": 415.1,
"r_x2": 491.5,
"r_y2": 407.1,
"r_x3": 484.1,
"r_y3": 407.1,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 494.7,
"r_y0": 414.9,
"r_x1": 545.1,
"r_y1": 414.9,
"r_x2": 545.1,
"r_y2": 407.2,
"r_x3": 494.7,
"r_y3": 407.2,
"coord_origin": "TOPLEFT"
},
"text": "2019 Interna-",
"orig": "2019 Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 425.9,
"r_x1": 545.1,
"r_y1": 425.9,
"r_x2": 545.1,
"r_y2": 418.1,
"r_x3": 328.8,
"r_y3": 418.1,
"coord_origin": "TOPLEFT"
},
"text": "tional Conference on Document Analysis and Recognition",
"orig": "tional Conference on Document Analysis and Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 436.8,
"r_x1": 360.8,
"r_y1": 436.8,
"r_x2": 360.8,
"r_y2": 429.1,
"r_x3": 328.8,
"r_y3": 429.1,
"coord_origin": "TOPLEFT"
},
"text": "(ICDAR)",
"orig": "(ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 360.8,
"r_y0": 437.0,
"r_x1": 475.6,
"r_y1": 437.0,
"r_x2": 475.6,
"r_y2": 429.0,
"r_x3": 360.8,
"r_y3": 429.0,
"coord_origin": "TOPLEFT"
},
"text": ", pages 128-133. IEEE, 2019. 1",
"orig": ", pages 128-133. IEEE, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"
},
{
"label": "list_item",
"id": 20,
"page_no": 8,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 440.4,
"r": 545.1,
"b": 558.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.5,
"r_x1": 324.6,
"r_y1": 448.5,
"r_x2": 324.6,
"r_y2": 440.4,
"r_x3": 308.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "[22]",
"orig": "[22]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 448.5,
"r_x1": 545.1,
"r_y1": 448.5,
"r_x2": 545.1,
"r_y2": 440.4,
"r_x3": 326.9,
"r_y3": 440.4,
"coord_origin": "TOPLEFT"
},
"text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 459.4,
"r_x1": 545.1,
"r_y1": 459.4,
"r_x2": 545.1,
"r_y2": 451.4,
"r_x3": 328.8,
"r_y3": 451.4,
"coord_origin": "TOPLEFT"
},
"text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 470.4,
"r_x1": 545.1,
"r_y1": 470.4,
"r_x2": 545.1,
"r_y2": 462.4,
"r_x3": 328.8,
"r_y3": 462.4,
"coord_origin": "TOPLEFT"
},
"text": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"orig": "Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 481.3,
"r_x1": 545.1,
"r_y1": 481.3,
"r_x2": 545.1,
"r_y2": 473.3,
"r_x3": 328.8,
"r_y3": 473.3,
"coord_origin": "TOPLEFT"
},
"text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 492.3,
"r_x1": 545.1,
"r_y1": 492.3,
"r_x2": 545.1,
"r_y2": 484.3,
"r_x3": 328.8,
"r_y3": 484.3,
"coord_origin": "TOPLEFT"
},
"text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 503.3,
"r_x1": 545.1,
"r_y1": 503.3,
"r_x2": 545.1,
"r_y2": 495.2,
"r_x3": 328.8,
"r_y3": 495.2,
"coord_origin": "TOPLEFT"
},
"text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 514.2,
"r_x1": 545.1,
"r_y1": 514.2,
"r_x2": 545.1,
"r_y2": 506.2,
"r_x3": 328.8,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "perative style, high-performance deep learning library. In H.",
"orig": "perative style, high-performance deep learning library. In H.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 525.2,
"r_x1": 545.1,
"r_y1": 525.2,
"r_x2": 545.1,
"r_y2": 517.2,
"r_x3": 328.8,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 536.1,
"r_x1": 434.6,
"r_y1": 536.1,
"r_x2": 434.6,
"r_y2": 528.1,
"r_x3": 328.8,
"r_y3": 528.1,
"coord_origin": "TOPLEFT"
},
"text": "Fox, and R. Garnett, editors,",
"orig": "Fox, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 437.9,
"r_y0": 535.9,
"r_x1": 545.1,
"r_y1": 535.9,
"r_x2": 545.1,
"r_y2": 528.2,
"r_x3": 437.9,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural Informa-",
"orig": "Advances in Neural Informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 546.9,
"r_x1": 425.7,
"r_y1": 546.9,
"r_x2": 425.7,
"r_y2": 539.2,
"r_x3": 328.8,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "tion Processing Systems 32",
"orig": "tion Processing Systems 32",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 425.7,
"r_y0": 547.1,
"r_x1": 545.1,
"r_y1": 547.1,
"r_x2": 545.1,
"r_y2": 539.1,
"r_x3": 425.7,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 8024-8035. Curran Asso-",
"orig": ", pages 8024-8035. Curran Asso-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 558.1,
"r_x1": 399.7,
"r_y1": 558.1,
"r_x2": 399.7,
"r_y2": 550.0,
"r_x3": 328.8,
"r_y3": 550.0,
"coord_origin": "TOPLEFT"
},
"text": "ciates, Inc., 2019. 6",
"orig": "ciates, Inc., 2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4e-Buc, E. Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"
},
{
"label": "list_item",
"id": 19,
"page_no": 8,
"cluster": {
"id": 19,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 561.5,
"r": 545.1,
"b": 624.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 569.5,
"r_x1": 324.5,
"r_y1": 569.5,
"r_x2": 324.5,
"r_y2": 561.5,
"r_x3": 308.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "[23]",
"orig": "[23]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.9,
"r_y0": 569.5,
"r_x1": 545.1,
"r_y1": 569.5,
"r_x2": 545.1,
"r_y2": 561.5,
"r_x3": 326.9,
"r_y3": 561.5,
"coord_origin": "TOPLEFT"
},
"text": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"orig": "Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 580.5,
"r_x1": 545.1,
"r_y1": 580.5,
"r_x2": 545.1,
"r_y2": 572.4,
"r_x3": 328.8,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 591.4,
"r_x1": 545.1,
"r_y1": 591.4,
"r_x2": 545.1,
"r_y2": 583.4,
"r_x3": 328.8,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "for end to end table detection and structure recognition from",
"orig": "for end to end table detection and structure recognition from",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 602.4,
"r_x1": 431.6,
"r_y1": 602.4,
"r_x2": 431.6,
"r_y2": 594.4,
"r_x3": 328.8,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "image-based documents. In",
"orig": "image-based documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 434.7,
"r_y0": 602.2,
"r_x1": 545.1,
"r_y1": 602.2,
"r_x2": 545.1,
"r_y2": 594.4,
"r_x3": 434.7,
"r_y3": 594.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF",
"orig": "Proceedings of the IEEE/CVF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 613.1,
"r_x1": 545.1,
"r_y1": 613.1,
"r_x2": 545.1,
"r_y2": 605.4,
"r_x3": 328.8,
"r_y3": 605.4,
"coord_origin": "TOPLEFT"
},
"text": "Conference on Computer Vision and Pattern Recognition",
"orig": "Conference on Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 624.1,
"r_x1": 367.8,
"r_y1": 624.1,
"r_x2": 367.8,
"r_y2": 616.4,
"r_x3": 328.8,
"r_y3": 616.4,
"coord_origin": "TOPLEFT"
},
"text": "Workshops",
"orig": "Workshops",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 367.8,
"r_y0": 624.3,
"r_x1": 458.7,
"r_y1": 624.3,
"r_x2": 458.7,
"r_y2": 616.3,
"r_x3": 367.8,
"r_y3": 616.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 572-573, 2020. 1",
"orig": ", pages 572-573, 2020. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"
},
{
"label": "list_item",
"id": 23,
"page_no": 8,
"cluster": {
"id": 23,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 627.7,
"r": 545.1,
"b": 668.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 186,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 635.7,
"r_x1": 324.7,
"r_y1": 635.7,
"r_x2": 324.7,
"r_y2": 627.7,
"r_x3": 308.9,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "[24]",
"orig": "[24]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 187,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 635.7,
"r_x1": 545.1,
"r_y1": 635.7,
"r_x2": 545.1,
"r_y2": 627.7,
"r_x3": 327.1,
"r_y3": 627.7,
"coord_origin": "TOPLEFT"
},
"text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 188,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 646.7,
"r_x1": 545.1,
"r_y1": 646.7,
"r_x2": 545.1,
"r_y2": 638.7,
"r_x3": 328.8,
"r_y3": 638.7,
"coord_origin": "TOPLEFT"
},
"text": "Rethinking table recognition using graph neural networks.",
"orig": "Rethinking table recognition using graph neural networks.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 189,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 657.7,
"r_x1": 336.3,
"r_y1": 657.7,
"r_x2": 336.3,
"r_y2": 649.6,
"r_x3": 328.8,
"r_y3": 649.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 190,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 338.1,
"r_y0": 657.4,
"r_x1": 545.1,
"r_y1": 657.4,
"r_x2": 545.1,
"r_y2": 649.7,
"r_x3": 338.1,
"r_y3": 649.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 191,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 668.4,
"r_x1": 406.3,
"r_y1": 668.4,
"r_x2": 406.3,
"r_y2": 660.7,
"r_x3": 328.8,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 192,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 668.6,
"r_x1": 521.1,
"r_y1": 668.6,
"r_x2": 521.1,
"r_y2": 660.6,
"r_x3": 406.3,
"r_y3": 660.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 142-147. IEEE, 2019. 3",
"orig": ", pages 142-147. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 24,
"page_no": 8,
"cluster": {
"id": 24,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 672.0,
"r": 545.1,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 193,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 680.1,
"r_x1": 324.7,
"r_y1": 680.1,
"r_x2": 324.7,
"r_y2": 672.0,
"r_x3": 308.9,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "[25]",
"orig": "[25]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 194,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.1,
"r_y0": 680.1,
"r_x1": 545.1,
"r_y1": 680.1,
"r_x2": 545.1,
"r_y2": 672.0,
"r_x3": 327.1,
"r_y3": 672.0,
"coord_origin": "TOPLEFT"
},
"text": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"orig": "Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 195,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 691.0,
"r_x1": 482.8,
"r_y1": 691.0,
"r_x2": 482.8,
"r_y2": 683.0,
"r_x3": 328.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Sadeghian, Ian Reid, and Silvio Savarese.",
"orig": "Sadeghian, Ian Reid, and Silvio Savarese.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 196,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.8,
"r_y0": 691.0,
"r_x1": 545.1,
"r_y1": 691.0,
"r_x2": 545.1,
"r_y2": 683.0,
"r_x3": 488.8,
"r_y3": 683.0,
"coord_origin": "TOPLEFT"
},
"text": "Generalized in-",
"orig": "Generalized in-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 197,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 702.0,
"r_x1": 545.1,
"r_y1": 702.0,
"r_x2": 545.1,
"r_y2": 694.0,
"r_x3": 328.8,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "tersection over union: A metric and a loss for bounding box",
"orig": "tersection over union: A metric and a loss for bounding box",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 198,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 712.9,
"r_x1": 379.2,
"r_y1": 712.9,
"r_x2": 379.2,
"r_y2": 704.9,
"r_x3": 328.8,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "regression. In",
"orig": "regression. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 199,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 381.6,
"r_y0": 712.7,
"r_x1": 545.1,
"r_y1": 712.7,
"r_x2": 545.1,
"r_y2": 705.0,
"r_x3": 381.6,
"r_y3": 705.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE/CVF Conference on",
"orig": "Proceedings of the IEEE/CVF Conference on",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"
}
],
"headers": [
{
"label": "page_footer",
"id": 22,
"page_no": 8,
"cluster": {
"id": 22,
"label": "page_footer",
"bbox": {
"l": 295.1,
"t": 734.1,
"r": 300.1,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 200,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 295.1,
"r_y0": 743.0,
"r_x1": 300.1,
"r_y1": 743.0,
"r_x2": 300.1,
"r_y2": 734.1,
"r_x3": 295.1,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "9",
"orig": "9",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9"
}
]
}
},
{
"page_no": 9,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.7,
"r_x1": 223.6,
"r_y1": 83.7,
"r_x2": 223.6,
"r_y2": 76.0,
"r_x3": 70.0,
"r_y3": 76.0,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.6,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 223.6,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 97.9,
"r_y1": 94.9,
"r_x2": 97.9,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 106.2,
"r_x1": 65.5,
"r_y1": 106.2,
"r_x2": 65.5,
"r_y2": 98.2,
"r_x3": 50.1,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 106.2,
"r_x1": 286.4,
"r_y1": 106.2,
"r_x2": 286.4,
"r_y2": 98.2,
"r_x3": 67.8,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 117.1,
"r_x1": 286.4,
"r_y1": 117.1,
"r_x2": 286.4,
"r_y2": 109.1,
"r_x3": 70.0,
"r_y3": 109.1,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 128.1,
"r_x1": 286.4,
"r_y1": 128.1,
"r_x2": 286.4,
"r_y2": 120.1,
"r_x3": 70.0,
"r_y3": 120.1,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.1,
"r_x1": 77.5,
"r_y1": 139.1,
"r_x2": 77.5,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.6,
"r_y0": 138.9,
"r_x1": 286.4,
"r_y1": 138.9,
"r_x2": 286.4,
"r_y2": 131.1,
"r_x3": 80.6,
"r_y3": 131.1,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 149.8,
"r_x1": 195.2,
"r_y1": 149.8,
"r_x2": 195.2,
"r_y2": 142.1,
"r_x3": 70.0,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.2,
"r_y0": 150.0,
"r_x1": 286.4,
"r_y1": 150.0,
"r_x2": 286.4,
"r_y2": 142.0,
"r_x3": 195.2,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 161.0,
"r_x1": 120.3,
"r_y1": 161.0,
"r_x2": 120.3,
"r_y2": 153.0,
"r_x3": 70.0,
"r_y3": 153.0,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 172.3,
"r_x1": 65.5,
"r_y1": 172.3,
"r_x2": 65.5,
"r_y2": 164.3,
"r_x3": 50.1,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 172.3,
"r_x1": 286.4,
"r_y1": 172.3,
"r_x2": 286.4,
"r_y2": 164.3,
"r_x3": 67.8,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.3,
"r_x1": 286.4,
"r_y1": 183.3,
"r_x2": 286.4,
"r_y2": 175.2,
"r_x3": 70.0,
"r_y3": 175.2,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 194.2,
"r_x1": 286.4,
"r_y1": 194.2,
"r_x2": 286.4,
"r_y2": 186.2,
"r_x3": 70.0,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.2,
"r_x1": 101.3,
"r_y1": 205.2,
"r_x2": 101.3,
"r_y2": 197.2,
"r_x3": 70.0,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.3,
"r_y0": 205.0,
"r_x1": 286.4,
"r_y1": 205.0,
"r_x2": 286.4,
"r_y2": 197.2,
"r_x3": 104.3,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 215.9,
"r_x1": 220.5,
"r_y1": 215.9,
"r_x2": 220.5,
"r_y2": 208.2,
"r_x3": 70.0,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.5,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 208.1,
"r_x3": 220.5,
"r_y3": 208.1,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.1,
"r_x1": 166.7,
"r_y1": 227.1,
"r_x2": 166.7,
"r_y2": 219.1,
"r_x3": 70.0,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 238.4,
"r_x1": 65.7,
"r_y1": 238.4,
"r_x2": 65.7,
"r_y2": 230.4,
"r_x3": 50.1,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 238.4,
"r_x1": 286.4,
"r_y1": 238.4,
"r_x2": 286.4,
"r_y2": 230.4,
"r_x3": 68.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.4,
"r_x1": 147.2,
"r_y1": 249.4,
"r_x2": 147.2,
"r_y2": 241.4,
"r_x3": 70.0,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.9,
"r_y0": 249.2,
"r_x1": 286.4,
"r_y1": 249.2,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 149.9,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.1,
"r_x1": 244.7,
"r_y1": 260.1,
"r_x2": 244.7,
"r_y2": 252.4,
"r_x3": 70.0,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.7,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.3,
"r_x3": 244.7,
"r_y3": 252.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.3,
"r_x1": 111.4,
"r_y1": 271.3,
"r_x2": 111.4,
"r_y2": 263.3,
"r_x3": 70.0,
"r_y3": 263.3,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 282.6,
"r_x1": 66.0,
"r_y1": 282.6,
"r_x2": 66.0,
"r_y2": 274.6,
"r_x3": 50.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 282.6,
"r_x1": 94.9,
"r_y1": 282.6,
"r_x2": 94.9,
"r_y2": 274.6,
"r_x3": 68.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.9,
"r_y0": 282.6,
"r_x1": 127.3,
"r_y1": 282.6,
"r_x2": 127.3,
"r_y2": 274.6,
"r_x3": 100.9,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.2,
"r_y0": 282.6,
"r_x1": 165.8,
"r_y1": 282.6,
"r_x2": 165.8,
"r_y2": 274.6,
"r_x3": 133.2,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.7,
"r_y0": 282.6,
"r_x1": 194.1,
"r_y1": 282.6,
"r_x2": 194.1,
"r_y2": 274.6,
"r_x3": 172.7,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.0,
"r_y0": 282.6,
"r_x1": 211.5,
"r_y1": 282.6,
"r_x2": 211.5,
"r_y2": 274.6,
"r_x3": 200.0,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.4,
"r_y0": 282.6,
"r_x1": 239.4,
"r_y1": 282.6,
"r_x2": 239.4,
"r_y2": 274.6,
"r_x3": 217.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 282.6,
"r_x1": 264.2,
"r_y1": 282.6,
"r_x2": 264.2,
"r_y2": 274.6,
"r_x3": 246.3,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.1,
"r_y0": 282.6,
"r_x1": 286.4,
"r_y1": 282.6,
"r_x2": 286.4,
"r_y2": 274.6,
"r_x3": 270.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.6,
"r_x1": 286.4,
"r_y1": 293.6,
"r_x2": 286.4,
"r_y2": 285.6,
"r_x3": 70.0,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 296.5,
"r_x3": 70.0,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.5,
"r_x3": 70.0,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.4,
"r_y0": 315.3,
"r_x1": 286.4,
"r_y1": 315.3,
"r_x2": 286.4,
"r_y2": 307.6,
"r_x3": 79.4,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 326.2,
"r_x1": 147.6,
"r_y1": 326.2,
"r_x2": 147.6,
"r_y2": 318.5,
"r_x3": 70.0,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.6,
"r_y0": 326.5,
"r_x1": 271.3,
"r_y1": 326.5,
"r_x2": 271.3,
"r_y2": 318.4,
"r_x3": 147.6,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 337.8,
"r_x1": 65.4,
"r_y1": 337.8,
"r_x2": 65.4,
"r_y2": 329.8,
"r_x3": 50.1,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 337.8,
"r_x1": 286.4,
"r_y1": 337.8,
"r_x2": 286.4,
"r_y2": 329.8,
"r_x3": 67.7,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.7,
"r_x1": 286.4,
"r_y1": 348.7,
"r_x2": 286.4,
"r_y2": 340.7,
"r_x3": 70.0,
"r_y3": 340.7,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 359.7,
"r_x1": 198.8,
"r_y1": 359.7,
"r_x2": 198.8,
"r_y2": 351.7,
"r_x3": 70.0,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 359.7,
"r_x1": 213.5,
"r_y1": 359.7,
"r_x2": 213.5,
"r_y2": 351.7,
"r_x3": 206.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.0,
"r_y0": 359.5,
"r_x1": 286.4,
"r_y1": 359.5,
"r_x2": 286.4,
"r_y2": 351.8,
"r_x3": 217.0,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 370.4,
"r_x1": 143.1,
"r_y1": 370.4,
"r_x2": 143.1,
"r_y2": 362.7,
"r_x3": 70.0,
"r_y3": 362.7,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.1,
"r_y0": 370.7,
"r_x1": 286.4,
"r_y1": 370.7,
"r_x2": 286.4,
"r_y2": 362.6,
"r_x3": 143.1,
"r_y3": 362.6,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 381.6,
"r_x1": 161.2,
"r_y1": 381.6,
"r_x2": 161.2,
"r_y2": 373.6,
"r_x3": 70.0,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 392.9,
"r_x1": 65.1,
"r_y1": 392.9,
"r_x2": 65.1,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 67.4,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 286.4,
"r_y1": 403.9,
"r_x2": 286.4,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 414.9,
"r_x1": 125.5,
"r_y1": 414.9,
"r_x2": 125.5,
"r_y2": 406.8,
"r_x3": 70.0,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.9,
"r_y0": 414.9,
"r_x1": 230.8,
"r_y1": 414.9,
"r_x2": 230.8,
"r_y2": 406.8,
"r_x3": 133.9,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.3,
"r_y0": 414.9,
"r_x1": 286.4,
"r_y1": 414.9,
"r_x2": 286.4,
"r_y2": 406.8,
"r_x3": 239.3,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 425.8,
"r_x1": 79.0,
"r_y1": 425.8,
"r_x2": 79.0,
"r_y2": 417.8,
"r_x3": 70.0,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 425.8,
"r_x1": 286.4,
"r_y1": 425.8,
"r_x2": 286.4,
"r_y2": 417.8,
"r_x3": 81.3,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.8,
"r_x1": 196.8,
"r_y1": 436.8,
"r_x2": 196.8,
"r_y2": 428.8,
"r_x3": 70.0,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.6,
"r_x1": 286.4,
"r_y1": 436.6,
"r_x2": 286.4,
"r_y2": 428.8,
"r_x3": 200.2,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 447.5,
"r_x1": 189.2,
"r_y1": 447.5,
"r_x2": 189.2,
"r_y2": 439.8,
"r_x3": 70.0,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.7,
"r_x1": 286.4,
"r_y1": 447.7,
"r_x2": 286.4,
"r_y2": 439.7,
"r_x3": 189.2,
"r_y3": 439.7,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 458.7,
"r_x1": 158.9,
"r_y1": 458.7,
"r_x2": 158.9,
"r_y2": 450.7,
"r_x3": 70.0,
"r_y3": 450.7,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 470.0,
"r_x1": 65.9,
"r_y1": 470.0,
"r_x2": 65.9,
"r_y2": 462.0,
"r_x3": 50.1,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.3,
"r_y0": 470.0,
"r_x1": 286.4,
"r_y1": 470.0,
"r_x2": 286.4,
"r_y2": 462.0,
"r_x3": 68.3,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.0,
"r_x1": 116.3,
"r_y1": 481.0,
"r_x2": 116.3,
"r_y2": 473.0,
"r_x3": 70.0,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.5,
"r_y0": 481.0,
"r_x1": 286.4,
"r_y1": 481.0,
"r_x2": 286.4,
"r_y2": 473.0,
"r_x3": 122.5,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 491.9,
"r_x1": 103.3,
"r_y1": 491.9,
"r_x2": 103.3,
"r_y2": 483.9,
"r_x3": 70.0,
"r_y3": 483.9,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.5,
"r_y0": 491.7,
"r_x1": 286.4,
"r_y1": 491.7,
"r_x2": 286.4,
"r_y2": 484.0,
"r_x3": 105.5,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 502.7,
"r_x1": 212.5,
"r_y1": 502.7,
"r_x2": 212.5,
"r_y2": 495.0,
"r_x3": 70.0,
"r_y3": 495.0,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.5,
"r_y0": 502.9,
"r_x1": 263.6,
"r_y1": 502.9,
"r_x2": 263.6,
"r_y2": 494.9,
"r_x3": 212.5,
"r_y3": 494.9,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.2,
"r_x1": 65.7,
"r_y1": 514.2,
"r_x2": 65.7,
"r_y2": 506.2,
"r_x3": 50.1,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 514.2,
"r_x1": 247.4,
"r_y1": 514.2,
"r_x2": 247.4,
"r_y2": 506.2,
"r_x3": 68.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.0,
"r_y0": 514.2,
"r_x1": 286.4,
"r_y1": 514.2,
"r_x2": 286.4,
"r_y2": 506.2,
"r_x3": 254.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.2,
"r_x1": 265.6,
"r_y1": 525.2,
"r_x2": 265.6,
"r_y2": 517.2,
"r_x3": 70.0,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.4,
"r_y0": 525.0,
"r_x1": 286.4,
"r_y1": 525.0,
"r_x2": 286.4,
"r_y2": 517.2,
"r_x3": 268.4,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.9,
"r_x1": 286.4,
"r_y1": 535.9,
"r_x2": 286.4,
"r_y2": 528.2,
"r_x3": 70.0,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 125.3,
"r_y1": 546.9,
"r_x2": 125.3,
"r_y2": 539.2,
"r_x3": 70.0,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 547.1,
"r_x1": 240.1,
"r_y1": 547.1,
"r_x2": 240.1,
"r_y2": 539.1,
"r_x3": 125.3,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 558.4,
"r_x1": 66.0,
"r_y1": 558.4,
"r_x2": 66.0,
"r_y2": 550.4,
"r_x3": 50.1,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.4,
"r_x3": 68.4,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.4,
"r_x1": 137.1,
"r_y1": 569.4,
"r_x2": 137.1,
"r_y2": 561.4,
"r_x3": 70.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 569.4,
"r_x1": 172.4,
"r_y1": 569.4,
"r_x2": 172.4,
"r_y2": 561.4,
"r_x3": 146.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.4,
"r_x1": 286.4,
"r_y1": 569.4,
"r_x2": 286.4,
"r_y2": 561.4,
"r_x3": 178.7,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 221.0,
"r_y1": 580.3,
"r_x2": 221.0,
"r_y2": 572.3,
"r_x3": 70.0,
"r_y3": 572.3,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.5,
"r_y0": 580.1,
"r_x1": 286.4,
"r_y1": 580.1,
"r_x2": 286.4,
"r_y2": 572.4,
"r_x3": 232.5,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.1,
"r_x1": 135.5,
"r_y1": 591.1,
"r_x2": 135.5,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.5,
"r_y0": 591.3,
"r_x1": 167.9,
"r_y1": 591.3,
"r_x2": 167.9,
"r_y2": 583.3,
"r_x3": 135.5,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.6,
"r_x1": 65.2,
"r_y1": 602.6,
"r_x2": 65.2,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 602.6,
"r_x1": 286.4,
"r_y1": 602.6,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 67.5,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.6,
"r_x1": 109.1,
"r_y1": 613.6,
"r_x2": 109.1,
"r_y2": 605.6,
"r_x3": 70.0,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.2,
"r_y0": 613.6,
"r_x1": 271.8,
"r_y1": 613.6,
"r_x2": 271.8,
"r_y2": 605.6,
"r_x3": 116.2,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.9,
"r_y0": 613.6,
"r_x1": 286.4,
"r_y1": 613.6,
"r_x2": 286.4,
"r_y2": 605.6,
"r_x3": 278.9,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.3,
"r_x1": 286.4,
"r_y1": 624.3,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.3,
"r_x1": 139.1,
"r_y1": 635.3,
"r_x2": 139.1,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.5,
"r_x1": 239.0,
"r_y1": 635.5,
"r_x2": 239.0,
"r_y2": 627.5,
"r_x3": 139.1,
"r_y3": 627.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.8,
"r_x1": 65.2,
"r_y1": 646.8,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.1,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 646.8,
"r_x1": 286.4,
"r_y1": 646.8,
"r_x2": 286.4,
"r_y2": 638.8,
"r_x3": 67.5,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 70.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.7,
"r_x1": 286.4,
"r_y1": 668.7,
"r_x2": 286.4,
"r_y2": 660.7,
"r_x3": 70.0,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 158.5,
"r_y1": 679.7,
"r_x2": 158.5,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.5,
"r_y0": 679.5,
"r_x1": 286.4,
"r_y1": 679.5,
"r_x2": 286.4,
"r_y2": 671.8,
"r_x3": 160.5,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 690.4,
"r_x1": 171.4,
"r_y1": 690.4,
"r_x2": 171.4,
"r_y2": 682.7,
"r_x3": 70.0,
"r_y3": 682.7,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.4,
"r_y0": 690.7,
"r_x1": 212.8,
"r_y1": 690.7,
"r_x2": 212.8,
"r_y2": 682.6,
"r_x3": 171.4,
"r_y3": 682.6,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.0,
"r_x1": 66.5,
"r_y1": 702.0,
"r_x2": 66.5,
"r_y2": 694.0,
"r_x3": 50.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 702.0,
"r_x1": 81.0,
"r_y1": 702.0,
"r_x2": 81.0,
"r_y2": 694.0,
"r_x3": 69.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.1,
"r_y0": 702.0,
"r_x1": 114.7,
"r_y1": 702.0,
"r_x2": 114.7,
"r_y2": 694.0,
"r_x3": 89.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.2,
"r_y0": 702.0,
"r_x1": 149.1,
"r_y1": 702.0,
"r_x2": 149.1,
"r_y2": 694.0,
"r_x3": 124.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 702.0,
"r_x1": 209.4,
"r_y1": 702.0,
"r_x2": 209.4,
"r_y2": 694.0,
"r_x3": 157.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 702.0,
"r_x1": 231.9,
"r_y1": 702.0,
"r_x2": 231.9,
"r_y2": 694.0,
"r_x3": 218.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.9,
"r_y0": 702.0,
"r_x1": 269.3,
"r_y1": 702.0,
"r_x2": 269.3,
"r_y2": 694.0,
"r_x3": 239.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.4,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 277.4,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 286.4,
"r_y1": 712.9,
"r_x2": 286.4,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 328.8,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 472.3,
"r_y1": 94.9,
"r_x2": 472.3,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.9,
"r_y0": 94.7,
"r_x1": 545.1,
"r_y1": 94.7,
"r_x2": 545.1,
"r_y2": 86.9,
"r_x3": 475.9,
"r_y3": 86.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.6,
"r_x1": 371.9,
"r_y1": 105.6,
"r_x2": 371.9,
"r_y2": 97.9,
"r_x3": 328.8,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.9,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 371.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 417.7,
"r_y1": 116.8,
"r_x2": 417.7,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 128.7,
"r_x1": 324.3,
"r_y1": 128.7,
"r_x2": 324.3,
"r_y2": 120.7,
"r_x3": 308.9,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.7,
"r_y0": 128.7,
"r_x1": 545.1,
"r_y1": 128.7,
"r_x2": 545.1,
"r_y2": 120.7,
"r_x3": 326.7,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 139.7,
"r_x1": 545.1,
"r_y1": 139.7,
"r_x2": 545.1,
"r_y2": 131.7,
"r_x3": 328.8,
"r_y3": 131.7,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 150.4,
"r_x1": 545.1,
"r_y1": 150.4,
"r_x2": 545.1,
"r_y2": 142.7,
"r_x3": 328.8,
"r_y3": 142.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.4,
"r_x1": 406.3,
"r_y1": 161.4,
"r_x2": 406.3,
"r_y2": 153.7,
"r_x3": 328.8,
"r_y3": 153.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 161.6,
"r_x1": 506.2,
"r_y1": 161.6,
"r_x2": 506.2,
"r_y2": 153.6,
"r_x3": 406.3,
"r_y3": 153.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 15,
"label": "text",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.7,
"r_x1": 223.6,
"r_y1": 83.7,
"r_x2": 223.6,
"r_y2": 76.0,
"r_x3": 70.0,
"r_y3": 76.0,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.6,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 223.6,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 97.9,
"r_y1": 94.9,
"r_x2": 97.9,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 98.2,
"r": 286.4,
"b": 161.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 106.2,
"r_x1": 65.5,
"r_y1": 106.2,
"r_x2": 65.5,
"r_y2": 98.2,
"r_x3": 50.1,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 106.2,
"r_x1": 286.4,
"r_y1": 106.2,
"r_x2": 286.4,
"r_y2": 98.2,
"r_x3": 67.8,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 117.1,
"r_x1": 286.4,
"r_y1": 117.1,
"r_x2": 286.4,
"r_y2": 109.1,
"r_x3": 70.0,
"r_y3": 109.1,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 128.1,
"r_x1": 286.4,
"r_y1": 128.1,
"r_x2": 286.4,
"r_y2": 120.1,
"r_x3": 70.0,
"r_y3": 120.1,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.1,
"r_x1": 77.5,
"r_y1": 139.1,
"r_x2": 77.5,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.6,
"r_y0": 138.9,
"r_x1": 286.4,
"r_y1": 138.9,
"r_x2": 286.4,
"r_y2": 131.1,
"r_x3": 80.6,
"r_y3": 131.1,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 149.8,
"r_x1": 195.2,
"r_y1": 149.8,
"r_x2": 195.2,
"r_y2": 142.1,
"r_x3": 70.0,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.2,
"r_y0": 150.0,
"r_x1": 286.4,
"r_y1": 150.0,
"r_x2": 286.4,
"r_y2": 142.0,
"r_x3": 195.2,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 161.0,
"r_x1": 120.3,
"r_y1": 161.0,
"r_x2": 120.3,
"r_y2": 153.0,
"r_x3": 70.0,
"r_y3": 153.0,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 164.3,
"r": 286.4,
"b": 227.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 172.3,
"r_x1": 65.5,
"r_y1": 172.3,
"r_x2": 65.5,
"r_y2": 164.3,
"r_x3": 50.1,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 172.3,
"r_x1": 286.4,
"r_y1": 172.3,
"r_x2": 286.4,
"r_y2": 164.3,
"r_x3": 67.8,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.3,
"r_x1": 286.4,
"r_y1": 183.3,
"r_x2": 286.4,
"r_y2": 175.2,
"r_x3": 70.0,
"r_y3": 175.2,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 194.2,
"r_x1": 286.4,
"r_y1": 194.2,
"r_x2": 286.4,
"r_y2": 186.2,
"r_x3": 70.0,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.2,
"r_x1": 101.3,
"r_y1": 205.2,
"r_x2": 101.3,
"r_y2": 197.2,
"r_x3": 70.0,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.3,
"r_y0": 205.0,
"r_x1": 286.4,
"r_y1": 205.0,
"r_x2": 286.4,
"r_y2": 197.2,
"r_x3": 104.3,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 215.9,
"r_x1": 220.5,
"r_y1": 215.9,
"r_x2": 220.5,
"r_y2": 208.2,
"r_x3": 70.0,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.5,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 208.1,
"r_x3": 220.5,
"r_y3": 208.1,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.1,
"r_x1": 166.7,
"r_y1": 227.1,
"r_x2": 166.7,
"r_y2": 219.1,
"r_x3": 70.0,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 230.4,
"r": 286.4,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 238.4,
"r_x1": 65.7,
"r_y1": 238.4,
"r_x2": 65.7,
"r_y2": 230.4,
"r_x3": 50.1,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 238.4,
"r_x1": 286.4,
"r_y1": 238.4,
"r_x2": 286.4,
"r_y2": 230.4,
"r_x3": 68.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.4,
"r_x1": 147.2,
"r_y1": 249.4,
"r_x2": 147.2,
"r_y2": 241.4,
"r_x3": 70.0,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.9,
"r_y0": 249.2,
"r_x1": 286.4,
"r_y1": 249.2,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 149.9,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.1,
"r_x1": 244.7,
"r_y1": 260.1,
"r_x2": 244.7,
"r_y2": 252.4,
"r_x3": 70.0,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.7,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.3,
"r_x3": 244.7,
"r_y3": 252.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.3,
"r_x1": 111.4,
"r_y1": 271.3,
"r_x2": 111.4,
"r_y2": 263.3,
"r_x3": 70.0,
"r_y3": 263.3,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 274.6,
"r": 286.4,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 282.6,
"r_x1": 66.0,
"r_y1": 282.6,
"r_x2": 66.0,
"r_y2": 274.6,
"r_x3": 50.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 282.6,
"r_x1": 94.9,
"r_y1": 282.6,
"r_x2": 94.9,
"r_y2": 274.6,
"r_x3": 68.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.9,
"r_y0": 282.6,
"r_x1": 127.3,
"r_y1": 282.6,
"r_x2": 127.3,
"r_y2": 274.6,
"r_x3": 100.9,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.2,
"r_y0": 282.6,
"r_x1": 165.8,
"r_y1": 282.6,
"r_x2": 165.8,
"r_y2": 274.6,
"r_x3": 133.2,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.7,
"r_y0": 282.6,
"r_x1": 194.1,
"r_y1": 282.6,
"r_x2": 194.1,
"r_y2": 274.6,
"r_x3": 172.7,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.0,
"r_y0": 282.6,
"r_x1": 211.5,
"r_y1": 282.6,
"r_x2": 211.5,
"r_y2": 274.6,
"r_x3": 200.0,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.4,
"r_y0": 282.6,
"r_x1": 239.4,
"r_y1": 282.6,
"r_x2": 239.4,
"r_y2": 274.6,
"r_x3": 217.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 282.6,
"r_x1": 264.2,
"r_y1": 282.6,
"r_x2": 264.2,
"r_y2": 274.6,
"r_x3": 246.3,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.1,
"r_y0": 282.6,
"r_x1": 286.4,
"r_y1": 282.6,
"r_x2": 286.4,
"r_y2": 274.6,
"r_x3": 270.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.6,
"r_x1": 286.4,
"r_y1": 293.6,
"r_x2": 286.4,
"r_y2": 285.6,
"r_x3": 70.0,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 296.5,
"r_x3": 70.0,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.5,
"r_x3": 70.0,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.4,
"r_y0": 315.3,
"r_x1": 286.4,
"r_y1": 315.3,
"r_x2": 286.4,
"r_y2": 307.6,
"r_x3": 79.4,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 326.2,
"r_x1": 147.6,
"r_y1": 326.2,
"r_x2": 147.6,
"r_y2": 318.5,
"r_x3": 70.0,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.6,
"r_y0": 326.5,
"r_x1": 271.3,
"r_y1": 326.5,
"r_x2": 271.3,
"r_y2": 318.4,
"r_x3": 147.6,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 329.8,
"r": 286.4,
"b": 381.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 337.8,
"r_x1": 65.4,
"r_y1": 337.8,
"r_x2": 65.4,
"r_y2": 329.8,
"r_x3": 50.1,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 337.8,
"r_x1": 286.4,
"r_y1": 337.8,
"r_x2": 286.4,
"r_y2": 329.8,
"r_x3": 67.7,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.7,
"r_x1": 286.4,
"r_y1": 348.7,
"r_x2": 286.4,
"r_y2": 340.7,
"r_x3": 70.0,
"r_y3": 340.7,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 359.7,
"r_x1": 198.8,
"r_y1": 359.7,
"r_x2": 198.8,
"r_y2": 351.7,
"r_x3": 70.0,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 359.7,
"r_x1": 213.5,
"r_y1": 359.7,
"r_x2": 213.5,
"r_y2": 351.7,
"r_x3": 206.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.0,
"r_y0": 359.5,
"r_x1": 286.4,
"r_y1": 359.5,
"r_x2": 286.4,
"r_y2": 351.8,
"r_x3": 217.0,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 370.4,
"r_x1": 143.1,
"r_y1": 370.4,
"r_x2": 143.1,
"r_y2": 362.7,
"r_x3": 70.0,
"r_y3": 362.7,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.1,
"r_y0": 370.7,
"r_x1": 286.4,
"r_y1": 370.7,
"r_x2": 286.4,
"r_y2": 362.6,
"r_x3": 143.1,
"r_y3": 362.6,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 381.6,
"r_x1": 161.2,
"r_y1": 381.6,
"r_x2": 161.2,
"r_y2": 373.6,
"r_x3": 70.0,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 384.9,
"r": 286.4,
"b": 458.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 392.9,
"r_x1": 65.1,
"r_y1": 392.9,
"r_x2": 65.1,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 67.4,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 286.4,
"r_y1": 403.9,
"r_x2": 286.4,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 414.9,
"r_x1": 125.5,
"r_y1": 414.9,
"r_x2": 125.5,
"r_y2": 406.8,
"r_x3": 70.0,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.9,
"r_y0": 414.9,
"r_x1": 230.8,
"r_y1": 414.9,
"r_x2": 230.8,
"r_y2": 406.8,
"r_x3": 133.9,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.3,
"r_y0": 414.9,
"r_x1": 286.4,
"r_y1": 414.9,
"r_x2": 286.4,
"r_y2": 406.8,
"r_x3": 239.3,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 425.8,
"r_x1": 79.0,
"r_y1": 425.8,
"r_x2": 79.0,
"r_y2": 417.8,
"r_x3": 70.0,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 425.8,
"r_x1": 286.4,
"r_y1": 425.8,
"r_x2": 286.4,
"r_y2": 417.8,
"r_x3": 81.3,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.8,
"r_x1": 196.8,
"r_y1": 436.8,
"r_x2": 196.8,
"r_y2": 428.8,
"r_x3": 70.0,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.6,
"r_x1": 286.4,
"r_y1": 436.6,
"r_x2": 286.4,
"r_y2": 428.8,
"r_x3": 200.2,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 447.5,
"r_x1": 189.2,
"r_y1": 447.5,
"r_x2": 189.2,
"r_y2": 439.8,
"r_x3": 70.0,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.7,
"r_x1": 286.4,
"r_y1": 447.7,
"r_x2": 286.4,
"r_y2": 439.7,
"r_x3": 189.2,
"r_y3": 439.7,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 458.7,
"r_x1": 158.9,
"r_y1": 458.7,
"r_x2": 158.9,
"r_y2": 450.7,
"r_x3": 70.0,
"r_y3": 450.7,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 462.0,
"r": 286.4,
"b": 502.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 470.0,
"r_x1": 65.9,
"r_y1": 470.0,
"r_x2": 65.9,
"r_y2": 462.0,
"r_x3": 50.1,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.3,
"r_y0": 470.0,
"r_x1": 286.4,
"r_y1": 470.0,
"r_x2": 286.4,
"r_y2": 462.0,
"r_x3": 68.3,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.0,
"r_x1": 116.3,
"r_y1": 481.0,
"r_x2": 116.3,
"r_y2": 473.0,
"r_x3": 70.0,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.5,
"r_y0": 481.0,
"r_x1": 286.4,
"r_y1": 481.0,
"r_x2": 286.4,
"r_y2": 473.0,
"r_x3": 122.5,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 491.9,
"r_x1": 103.3,
"r_y1": 491.9,
"r_x2": 103.3,
"r_y2": 483.9,
"r_x3": 70.0,
"r_y3": 483.9,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.5,
"r_y0": 491.7,
"r_x1": 286.4,
"r_y1": 491.7,
"r_x2": 286.4,
"r_y2": 484.0,
"r_x3": 105.5,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 502.7,
"r_x1": 212.5,
"r_y1": 502.7,
"r_x2": 212.5,
"r_y2": 495.0,
"r_x3": 70.0,
"r_y3": 495.0,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.5,
"r_y0": 502.9,
"r_x1": 263.6,
"r_y1": 502.9,
"r_x2": 263.6,
"r_y2": 494.9,
"r_x3": 212.5,
"r_y3": 494.9,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 506.2,
"r": 286.4,
"b": 547.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.2,
"r_x1": 65.7,
"r_y1": 514.2,
"r_x2": 65.7,
"r_y2": 506.2,
"r_x3": 50.1,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 514.2,
"r_x1": 247.4,
"r_y1": 514.2,
"r_x2": 247.4,
"r_y2": 506.2,
"r_x3": 68.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.0,
"r_y0": 514.2,
"r_x1": 286.4,
"r_y1": 514.2,
"r_x2": 286.4,
"r_y2": 506.2,
"r_x3": 254.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.2,
"r_x1": 265.6,
"r_y1": 525.2,
"r_x2": 265.6,
"r_y2": 517.2,
"r_x3": 70.0,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.4,
"r_y0": 525.0,
"r_x1": 286.4,
"r_y1": 525.0,
"r_x2": 286.4,
"r_y2": 517.2,
"r_x3": 268.4,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.9,
"r_x1": 286.4,
"r_y1": 535.9,
"r_x2": 286.4,
"r_y2": 528.2,
"r_x3": 70.0,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 125.3,
"r_y1": 546.9,
"r_x2": 125.3,
"r_y2": 539.2,
"r_x3": 70.0,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 547.1,
"r_x1": 240.1,
"r_y1": 547.1,
"r_x2": 240.1,
"r_y2": 539.1,
"r_x3": 125.3,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 550.4,
"r": 286.4,
"b": 591.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.82,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 558.4,
"r_x1": 66.0,
"r_y1": 558.4,
"r_x2": 66.0,
"r_y2": 550.4,
"r_x3": 50.1,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.4,
"r_x3": 68.4,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.4,
"r_x1": 137.1,
"r_y1": 569.4,
"r_x2": 137.1,
"r_y2": 561.4,
"r_x3": 70.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 569.4,
"r_x1": 172.4,
"r_y1": 569.4,
"r_x2": 172.4,
"r_y2": 561.4,
"r_x3": 146.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.4,
"r_x1": 286.4,
"r_y1": 569.4,
"r_x2": 286.4,
"r_y2": 561.4,
"r_x3": 178.7,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 221.0,
"r_y1": 580.3,
"r_x2": 221.0,
"r_y2": 572.3,
"r_x3": 70.0,
"r_y3": 572.3,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.5,
"r_y0": 580.1,
"r_x1": 286.4,
"r_y1": 580.1,
"r_x2": 286.4,
"r_y2": 572.4,
"r_x3": 232.5,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.1,
"r_x1": 135.5,
"r_y1": 591.1,
"r_x2": 135.5,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.5,
"r_y0": 591.3,
"r_x1": 167.9,
"r_y1": 591.3,
"r_x2": 167.9,
"r_y2": 583.3,
"r_x3": 135.5,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.6,
"r": 286.4,
"b": 635.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.6,
"r_x1": 65.2,
"r_y1": 602.6,
"r_x2": 65.2,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 602.6,
"r_x1": 286.4,
"r_y1": 602.6,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 67.5,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.6,
"r_x1": 109.1,
"r_y1": 613.6,
"r_x2": 109.1,
"r_y2": 605.6,
"r_x3": 70.0,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.2,
"r_y0": 613.6,
"r_x1": 271.8,
"r_y1": 613.6,
"r_x2": 271.8,
"r_y2": 605.6,
"r_x3": 116.2,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.9,
"r_y0": 613.6,
"r_x1": 286.4,
"r_y1": 613.6,
"r_x2": 286.4,
"r_y2": 605.6,
"r_x3": 278.9,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.3,
"r_x1": 286.4,
"r_y1": 624.3,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.3,
"r_x1": 139.1,
"r_y1": 635.3,
"r_x2": 139.1,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.5,
"r_x1": 239.0,
"r_y1": 635.5,
"r_x2": 239.0,
"r_y2": 627.5,
"r_x3": 139.1,
"r_y3": 627.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 638.8,
"r": 286.4,
"b": 690.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.8,
"r_x1": 65.2,
"r_y1": 646.8,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.1,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 646.8,
"r_x1": 286.4,
"r_y1": 646.8,
"r_x2": 286.4,
"r_y2": 638.8,
"r_x3": 67.5,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 70.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.7,
"r_x1": 286.4,
"r_y1": 668.7,
"r_x2": 286.4,
"r_y2": 660.7,
"r_x3": 70.0,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 158.5,
"r_y1": 679.7,
"r_x2": 158.5,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.5,
"r_y0": 679.5,
"r_x1": 286.4,
"r_y1": 679.5,
"r_x2": 286.4,
"r_y2": 671.8,
"r_x3": 160.5,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 690.4,
"r_x1": 171.4,
"r_y1": 690.4,
"r_x2": 171.4,
"r_y2": 682.7,
"r_x3": 70.0,
"r_y3": 682.7,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.4,
"r_y0": 690.7,
"r_x1": 212.8,
"r_y1": 690.7,
"r_x2": 212.8,
"r_y2": 682.6,
"r_x3": 171.4,
"r_y3": 682.6,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 694.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.0,
"r_x1": 66.5,
"r_y1": 702.0,
"r_x2": 66.5,
"r_y2": 694.0,
"r_x3": 50.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 702.0,
"r_x1": 81.0,
"r_y1": 702.0,
"r_x2": 81.0,
"r_y2": 694.0,
"r_x3": 69.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.1,
"r_y0": 702.0,
"r_x1": 114.7,
"r_y1": 702.0,
"r_x2": 114.7,
"r_y2": 694.0,
"r_x3": 89.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.2,
"r_y0": 702.0,
"r_x1": 149.1,
"r_y1": 702.0,
"r_x2": 149.1,
"r_y2": 694.0,
"r_x3": 124.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 702.0,
"r_x1": 209.4,
"r_y1": 702.0,
"r_x2": 209.4,
"r_y2": 694.0,
"r_x3": 157.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 702.0,
"r_x1": 231.9,
"r_y1": 702.0,
"r_x2": 231.9,
"r_y2": 694.0,
"r_x3": 218.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.9,
"r_y0": 702.0,
"r_x1": 269.3,
"r_y1": 702.0,
"r_x2": 269.3,
"r_y2": 694.0,
"r_x3": 239.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.4,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 277.4,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 286.4,
"r_y1": 712.9,
"r_x2": 286.4,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.8,
"t": 75.9,
"r": 545.1,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 328.8,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 472.3,
"r_y1": 94.9,
"r_x2": 472.3,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.9,
"r_y0": 94.7,
"r_x1": 545.1,
"r_y1": 94.7,
"r_x2": 545.1,
"r_y2": 86.9,
"r_x3": 475.9,
"r_y3": 86.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.6,
"r_x1": 371.9,
"r_y1": 105.6,
"r_x2": 371.9,
"r_y2": 97.9,
"r_x3": 328.8,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.9,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 371.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 417.7,
"r_y1": 116.8,
"r_x2": 417.7,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 120.7,
"r": 545.1,
"b": 161.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 128.7,
"r_x1": 324.3,
"r_y1": 128.7,
"r_x2": 324.3,
"r_y2": 120.7,
"r_x3": 308.9,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.7,
"r_y0": 128.7,
"r_x1": 545.1,
"r_y1": 128.7,
"r_x2": 545.1,
"r_y2": 120.7,
"r_x3": 326.7,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 139.7,
"r_x1": 545.1,
"r_y1": 139.7,
"r_x2": 545.1,
"r_y2": 131.7,
"r_x3": 328.8,
"r_y3": 131.7,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 150.4,
"r_x1": 545.1,
"r_y1": 150.4,
"r_x2": 545.1,
"r_y2": 142.7,
"r_x3": 328.8,
"r_y3": 142.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.4,
"r_x1": 406.3,
"r_y1": 161.4,
"r_x2": 406.3,
"r_y2": 153.7,
"r_x3": 328.8,
"r_y3": 153.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 161.6,
"r_x1": 506.2,
"r_y1": 161.6,
"r_x2": 506.2,
"r_y2": 153.6,
"r_x3": 406.3,
"r_y3": 153.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 15,
"page_no": 9,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.7,
"r_x1": 223.6,
"r_y1": 83.7,
"r_x2": 223.6,
"r_y2": 76.0,
"r_x3": 70.0,
"r_y3": 76.0,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.6,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 223.6,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 97.9,
"r_y1": 94.9,
"r_x2": 97.9,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"
},
{
"label": "list_item",
"id": 13,
"page_no": 9,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 98.2,
"r": 286.4,
"b": 161.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 106.2,
"r_x1": 65.5,
"r_y1": 106.2,
"r_x2": 65.5,
"r_y2": 98.2,
"r_x3": 50.1,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 106.2,
"r_x1": 286.4,
"r_y1": 106.2,
"r_x2": 286.4,
"r_y2": 98.2,
"r_x3": 67.8,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 117.1,
"r_x1": 286.4,
"r_y1": 117.1,
"r_x2": 286.4,
"r_y2": 109.1,
"r_x3": 70.0,
"r_y3": 109.1,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 128.1,
"r_x1": 286.4,
"r_y1": 128.1,
"r_x2": 286.4,
"r_y2": 120.1,
"r_x3": 70.0,
"r_y3": 120.1,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.1,
"r_x1": 77.5,
"r_y1": 139.1,
"r_x2": 77.5,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.6,
"r_y0": 138.9,
"r_x1": 286.4,
"r_y1": 138.9,
"r_x2": 286.4,
"r_y2": 131.1,
"r_x3": 80.6,
"r_y3": 131.1,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 149.8,
"r_x1": 195.2,
"r_y1": 149.8,
"r_x2": 195.2,
"r_y2": 142.1,
"r_x3": 70.0,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.2,
"r_y0": 150.0,
"r_x1": 286.4,
"r_y1": 150.0,
"r_x2": 286.4,
"r_y2": 142.0,
"r_x3": 195.2,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 161.0,
"r_x1": 120.3,
"r_y1": 161.0,
"r_x2": 120.3,
"r_y2": 153.0,
"r_x3": 70.0,
"r_y3": 153.0,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1"
},
{
"label": "list_item",
"id": 2,
"page_no": 9,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 164.3,
"r": 286.4,
"b": 227.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 172.3,
"r_x1": 65.5,
"r_y1": 172.3,
"r_x2": 65.5,
"r_y2": 164.3,
"r_x3": 50.1,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 172.3,
"r_x1": 286.4,
"r_y1": 172.3,
"r_x2": 286.4,
"r_y2": 164.3,
"r_x3": 67.8,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.3,
"r_x1": 286.4,
"r_y1": 183.3,
"r_x2": 286.4,
"r_y2": 175.2,
"r_x3": 70.0,
"r_y3": 175.2,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 194.2,
"r_x1": 286.4,
"r_y1": 194.2,
"r_x2": 286.4,
"r_y2": 186.2,
"r_x3": 70.0,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.2,
"r_x1": 101.3,
"r_y1": 205.2,
"r_x2": 101.3,
"r_y2": 197.2,
"r_x3": 70.0,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.3,
"r_y0": 205.0,
"r_x1": 286.4,
"r_y1": 205.0,
"r_x2": 286.4,
"r_y2": 197.2,
"r_x3": 104.3,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 215.9,
"r_x1": 220.5,
"r_y1": 215.9,
"r_x2": 220.5,
"r_y2": 208.2,
"r_x3": 70.0,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.5,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 208.1,
"r_x3": 220.5,
"r_y3": 208.1,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.1,
"r_x1": 166.7,
"r_y1": 227.1,
"r_x2": 166.7,
"r_y2": 219.1,
"r_x3": 70.0,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"
},
{
"label": "list_item",
"id": 4,
"page_no": 9,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 230.4,
"r": 286.4,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 238.4,
"r_x1": 65.7,
"r_y1": 238.4,
"r_x2": 65.7,
"r_y2": 230.4,
"r_x3": 50.1,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 238.4,
"r_x1": 286.4,
"r_y1": 238.4,
"r_x2": 286.4,
"r_y2": 230.4,
"r_x3": 68.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.4,
"r_x1": 147.2,
"r_y1": 249.4,
"r_x2": 147.2,
"r_y2": 241.4,
"r_x3": 70.0,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.9,
"r_y0": 249.2,
"r_x1": 286.4,
"r_y1": 249.2,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 149.9,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.1,
"r_x1": 244.7,
"r_y1": 260.1,
"r_x2": 244.7,
"r_y2": 252.4,
"r_x3": 70.0,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.7,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.3,
"r_x3": 244.7,
"r_y3": 252.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.3,
"r_x1": 111.4,
"r_y1": 271.3,
"r_x2": 111.4,
"r_y2": 263.3,
"r_x3": 70.0,
"r_y3": 263.3,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 9,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 274.6,
"r": 286.4,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 282.6,
"r_x1": 66.0,
"r_y1": 282.6,
"r_x2": 66.0,
"r_y2": 274.6,
"r_x3": 50.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 282.6,
"r_x1": 94.9,
"r_y1": 282.6,
"r_x2": 94.9,
"r_y2": 274.6,
"r_x3": 68.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.9,
"r_y0": 282.6,
"r_x1": 127.3,
"r_y1": 282.6,
"r_x2": 127.3,
"r_y2": 274.6,
"r_x3": 100.9,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.2,
"r_y0": 282.6,
"r_x1": 165.8,
"r_y1": 282.6,
"r_x2": 165.8,
"r_y2": 274.6,
"r_x3": 133.2,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.7,
"r_y0": 282.6,
"r_x1": 194.1,
"r_y1": 282.6,
"r_x2": 194.1,
"r_y2": 274.6,
"r_x3": 172.7,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.0,
"r_y0": 282.6,
"r_x1": 211.5,
"r_y1": 282.6,
"r_x2": 211.5,
"r_y2": 274.6,
"r_x3": 200.0,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.4,
"r_y0": 282.6,
"r_x1": 239.4,
"r_y1": 282.6,
"r_x2": 239.4,
"r_y2": 274.6,
"r_x3": 217.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 282.6,
"r_x1": 264.2,
"r_y1": 282.6,
"r_x2": 264.2,
"r_y2": 274.6,
"r_x3": 246.3,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.1,
"r_y0": 282.6,
"r_x1": 286.4,
"r_y1": 282.6,
"r_x2": 286.4,
"r_y2": 274.6,
"r_x3": 270.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.6,
"r_x1": 286.4,
"r_y1": 293.6,
"r_x2": 286.4,
"r_y2": 285.6,
"r_x3": 70.0,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 296.5,
"r_x3": 70.0,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.5,
"r_x3": 70.0,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.4,
"r_y0": 315.3,
"r_x1": 286.4,
"r_y1": 315.3,
"r_x2": 286.4,
"r_y2": 307.6,
"r_x3": 79.4,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 326.2,
"r_x1": 147.6,
"r_y1": 326.2,
"r_x2": 147.6,
"r_y2": 318.5,
"r_x3": 70.0,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.6,
"r_y0": 326.5,
"r_x1": 271.3,
"r_y1": 326.5,
"r_x2": 271.3,
"r_y2": 318.4,
"r_x3": 147.6,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 3,
"page_no": 9,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 329.8,
"r": 286.4,
"b": 381.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 337.8,
"r_x1": 65.4,
"r_y1": 337.8,
"r_x2": 65.4,
"r_y2": 329.8,
"r_x3": 50.1,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 337.8,
"r_x1": 286.4,
"r_y1": 337.8,
"r_x2": 286.4,
"r_y2": 329.8,
"r_x3": 67.7,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.7,
"r_x1": 286.4,
"r_y1": 348.7,
"r_x2": 286.4,
"r_y2": 340.7,
"r_x3": 70.0,
"r_y3": 340.7,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 359.7,
"r_x1": 198.8,
"r_y1": 359.7,
"r_x2": 198.8,
"r_y2": 351.7,
"r_x3": 70.0,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 359.7,
"r_x1": 213.5,
"r_y1": 359.7,
"r_x2": 213.5,
"r_y2": 351.7,
"r_x3": 206.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.0,
"r_y0": 359.5,
"r_x1": 286.4,
"r_y1": 359.5,
"r_x2": 286.4,
"r_y2": 351.8,
"r_x3": 217.0,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 370.4,
"r_x1": 143.1,
"r_y1": 370.4,
"r_x2": 143.1,
"r_y2": 362.7,
"r_x3": 70.0,
"r_y3": 362.7,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.1,
"r_y0": 370.7,
"r_x1": 286.4,
"r_y1": 370.7,
"r_x2": 286.4,
"r_y2": 362.6,
"r_x3": 143.1,
"r_y3": 362.6,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 381.6,
"r_x1": 161.2,
"r_y1": 381.6,
"r_x2": 161.2,
"r_y2": 373.6,
"r_x3": 70.0,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"
},
{
"label": "list_item",
"id": 1,
"page_no": 9,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 384.9,
"r": 286.4,
"b": 458.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 392.9,
"r_x1": 65.1,
"r_y1": 392.9,
"r_x2": 65.1,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 67.4,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 286.4,
"r_y1": 403.9,
"r_x2": 286.4,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 414.9,
"r_x1": 125.5,
"r_y1": 414.9,
"r_x2": 125.5,
"r_y2": 406.8,
"r_x3": 70.0,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.9,
"r_y0": 414.9,
"r_x1": 230.8,
"r_y1": 414.9,
"r_x2": 230.8,
"r_y2": 406.8,
"r_x3": 133.9,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.3,
"r_y0": 414.9,
"r_x1": 286.4,
"r_y1": 414.9,
"r_x2": 286.4,
"r_y2": 406.8,
"r_x3": 239.3,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 425.8,
"r_x1": 79.0,
"r_y1": 425.8,
"r_x2": 79.0,
"r_y2": 417.8,
"r_x3": 70.0,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 425.8,
"r_x1": 286.4,
"r_y1": 425.8,
"r_x2": 286.4,
"r_y2": 417.8,
"r_x3": 81.3,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.8,
"r_x1": 196.8,
"r_y1": 436.8,
"r_x2": 196.8,
"r_y2": 428.8,
"r_x3": 70.0,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.6,
"r_x1": 286.4,
"r_y1": 436.6,
"r_x2": 286.4,
"r_y2": 428.8,
"r_x3": 200.2,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 447.5,
"r_x1": 189.2,
"r_y1": 447.5,
"r_x2": 189.2,
"r_y2": 439.8,
"r_x3": 70.0,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.7,
"r_x1": 286.4,
"r_y1": 447.7,
"r_x2": 286.4,
"r_y2": 439.7,
"r_x3": 189.2,
"r_y3": 439.7,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 458.7,
"r_x1": 158.9,
"r_y1": 458.7,
"r_x2": 158.9,
"r_y2": 450.7,
"r_x3": 70.0,
"r_y3": 450.7,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"
},
{
"label": "list_item",
"id": 6,
"page_no": 9,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 462.0,
"r": 286.4,
"b": 502.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 470.0,
"r_x1": 65.9,
"r_y1": 470.0,
"r_x2": 65.9,
"r_y2": 462.0,
"r_x3": 50.1,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.3,
"r_y0": 470.0,
"r_x1": 286.4,
"r_y1": 470.0,
"r_x2": 286.4,
"r_y2": 462.0,
"r_x3": 68.3,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.0,
"r_x1": 116.3,
"r_y1": 481.0,
"r_x2": 116.3,
"r_y2": 473.0,
"r_x3": 70.0,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.5,
"r_y0": 481.0,
"r_x1": 286.4,
"r_y1": 481.0,
"r_x2": 286.4,
"r_y2": 473.0,
"r_x3": 122.5,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 491.9,
"r_x1": 103.3,
"r_y1": 491.9,
"r_x2": 103.3,
"r_y2": 483.9,
"r_x3": 70.0,
"r_y3": 483.9,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.5,
"r_y0": 491.7,
"r_x1": 286.4,
"r_y1": 491.7,
"r_x2": 286.4,
"r_y2": 484.0,
"r_x3": 105.5,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 502.7,
"r_x1": 212.5,
"r_y1": 502.7,
"r_x2": 212.5,
"r_y2": 495.0,
"r_x3": 70.0,
"r_y3": 495.0,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.5,
"r_y0": 502.9,
"r_x1": 263.6,
"r_y1": 502.9,
"r_x2": 263.6,
"r_y2": 494.9,
"r_x3": 212.5,
"r_y3": 494.9,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"
},
{
"label": "list_item",
"id": 7,
"page_no": 9,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 506.2,
"r": 286.4,
"b": 547.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.2,
"r_x1": 65.7,
"r_y1": 514.2,
"r_x2": 65.7,
"r_y2": 506.2,
"r_x3": 50.1,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 514.2,
"r_x1": 247.4,
"r_y1": 514.2,
"r_x2": 247.4,
"r_y2": 506.2,
"r_x3": 68.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.0,
"r_y0": 514.2,
"r_x1": 286.4,
"r_y1": 514.2,
"r_x2": 286.4,
"r_y2": 506.2,
"r_x3": 254.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.2,
"r_x1": 265.6,
"r_y1": 525.2,
"r_x2": 265.6,
"r_y2": 517.2,
"r_x3": 70.0,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.4,
"r_y0": 525.0,
"r_x1": 286.4,
"r_y1": 525.0,
"r_x2": 286.4,
"r_y2": 517.2,
"r_x3": 268.4,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.9,
"r_x1": 286.4,
"r_y1": 535.9,
"r_x2": 286.4,
"r_y2": 528.2,
"r_x3": 70.0,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 125.3,
"r_y1": 546.9,
"r_x2": 125.3,
"r_y2": 539.2,
"r_x3": 70.0,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 547.1,
"r_x1": 240.1,
"r_y1": 547.1,
"r_x2": 240.1,
"r_y2": 539.1,
"r_x3": 125.3,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 11,
"page_no": 9,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 550.4,
"r": 286.4,
"b": 591.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.82,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 558.4,
"r_x1": 66.0,
"r_y1": 558.4,
"r_x2": 66.0,
"r_y2": 550.4,
"r_x3": 50.1,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.4,
"r_x3": 68.4,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.4,
"r_x1": 137.1,
"r_y1": 569.4,
"r_x2": 137.1,
"r_y2": 561.4,
"r_x3": 70.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 569.4,
"r_x1": 172.4,
"r_y1": 569.4,
"r_x2": 172.4,
"r_y2": 561.4,
"r_x3": 146.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.4,
"r_x1": 286.4,
"r_y1": 569.4,
"r_x2": 286.4,
"r_y2": 561.4,
"r_x3": 178.7,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 221.0,
"r_y1": 580.3,
"r_x2": 221.0,
"r_y2": 572.3,
"r_x3": 70.0,
"r_y3": 572.3,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.5,
"r_y0": 580.1,
"r_x1": 286.4,
"r_y1": 580.1,
"r_x2": 286.4,
"r_y2": 572.4,
"r_x3": 232.5,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.1,
"r_x1": 135.5,
"r_y1": 591.1,
"r_x2": 135.5,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.5,
"r_y0": 591.3,
"r_x1": 167.9,
"r_y1": 591.3,
"r_x2": 167.9,
"r_y2": 583.3,
"r_x3": 135.5,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"
},
{
"label": "list_item",
"id": 10,
"page_no": 9,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.6,
"r": 286.4,
"b": 635.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.6,
"r_x1": 65.2,
"r_y1": 602.6,
"r_x2": 65.2,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 602.6,
"r_x1": 286.4,
"r_y1": 602.6,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 67.5,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.6,
"r_x1": 109.1,
"r_y1": 613.6,
"r_x2": 109.1,
"r_y2": 605.6,
"r_x3": 70.0,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.2,
"r_y0": 613.6,
"r_x1": 271.8,
"r_y1": 613.6,
"r_x2": 271.8,
"r_y2": 605.6,
"r_x3": 116.2,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.9,
"r_y0": 613.6,
"r_x1": 286.4,
"r_y1": 613.6,
"r_x2": 286.4,
"r_y2": 605.6,
"r_x3": 278.9,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.3,
"r_x1": 286.4,
"r_y1": 624.3,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.3,
"r_x1": 139.1,
"r_y1": 635.3,
"r_x2": 139.1,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.5,
"r_x1": 239.0,
"r_y1": 635.5,
"r_x2": 239.0,
"r_y2": 627.5,
"r_x3": 139.1,
"r_y3": 627.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"
},
{
"label": "list_item",
"id": 12,
"page_no": 9,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 638.8,
"r": 286.4,
"b": 690.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.8,
"r_x1": 65.2,
"r_y1": 646.8,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.1,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 646.8,
"r_x1": 286.4,
"r_y1": 646.8,
"r_x2": 286.4,
"r_y2": 638.8,
"r_x3": 67.5,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 70.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.7,
"r_x1": 286.4,
"r_y1": 668.7,
"r_x2": 286.4,
"r_y2": 660.7,
"r_x3": 70.0,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 158.5,
"r_y1": 679.7,
"r_x2": 158.5,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.5,
"r_y0": 679.5,
"r_x1": 286.4,
"r_y1": 679.5,
"r_x2": 286.4,
"r_y2": 671.8,
"r_x3": 160.5,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 690.4,
"r_x1": 171.4,
"r_y1": 690.4,
"r_x2": 171.4,
"r_y2": 682.7,
"r_x3": 70.0,
"r_y3": 682.7,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.4,
"r_y0": 690.7,
"r_x1": 212.8,
"r_y1": 690.7,
"r_x2": 212.8,
"r_y2": 682.6,
"r_x3": 171.4,
"r_y3": 682.6,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 9,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 694.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.0,
"r_x1": 66.5,
"r_y1": 702.0,
"r_x2": 66.5,
"r_y2": 694.0,
"r_x3": 50.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 702.0,
"r_x1": 81.0,
"r_y1": 702.0,
"r_x2": 81.0,
"r_y2": 694.0,
"r_x3": 69.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.1,
"r_y0": 702.0,
"r_x1": 114.7,
"r_y1": 702.0,
"r_x2": 114.7,
"r_y2": 694.0,
"r_x3": 89.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.2,
"r_y0": 702.0,
"r_x1": 149.1,
"r_y1": 702.0,
"r_x2": 149.1,
"r_y2": 694.0,
"r_x3": 124.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 702.0,
"r_x1": 209.4,
"r_y1": 702.0,
"r_x2": 209.4,
"r_y2": 694.0,
"r_x3": 157.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 702.0,
"r_x1": 231.9,
"r_y1": 702.0,
"r_x2": 231.9,
"r_y2": 694.0,
"r_x3": 218.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.9,
"r_y0": 702.0,
"r_x1": 269.3,
"r_y1": 702.0,
"r_x2": 269.3,
"r_y2": 694.0,
"r_x3": 239.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.4,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 277.4,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 286.4,
"r_y1": 712.9,
"r_x2": 286.4,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"
},
{
"label": "list_item",
"id": 14,
"page_no": 9,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.8,
"t": 75.9,
"r": 545.1,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 328.8,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 472.3,
"r_y1": 94.9,
"r_x2": 472.3,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.9,
"r_y0": 94.7,
"r_x1": 545.1,
"r_y1": 94.7,
"r_x2": 545.1,
"r_y2": 86.9,
"r_x3": 475.9,
"r_y3": 86.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.6,
"r_x1": 371.9,
"r_y1": 105.6,
"r_x2": 371.9,
"r_y2": 97.9,
"r_x3": 328.8,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.9,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 371.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 417.7,
"r_y1": 116.8,
"r_x2": 417.7,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"
},
{
"label": "list_item",
"id": 9,
"page_no": 9,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 120.7,
"r": 545.1,
"b": 161.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 128.7,
"r_x1": 324.3,
"r_y1": 128.7,
"r_x2": 324.3,
"r_y2": 120.7,
"r_x3": 308.9,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.7,
"r_y0": 128.7,
"r_x1": 545.1,
"r_y1": 128.7,
"r_x2": 545.1,
"r_y2": 120.7,
"r_x3": 326.7,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 139.7,
"r_x1": 545.1,
"r_y1": 139.7,
"r_x2": 545.1,
"r_y2": 131.7,
"r_x3": 328.8,
"r_y3": 131.7,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 150.4,
"r_x1": 545.1,
"r_y1": 150.4,
"r_x2": 545.1,
"r_y2": 142.7,
"r_x3": 328.8,
"r_y3": 142.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.4,
"r_x1": 406.3,
"r_y1": 161.4,
"r_x2": 406.3,
"r_y2": 153.7,
"r_x3": 328.8,
"r_y3": 153.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 161.6,
"r_x1": 506.2,
"r_y1": 161.6,
"r_x2": 506.2,
"r_y2": 153.6,
"r_x3": 406.3,
"r_y3": 153.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"
},
{
"label": "page_footer",
"id": 0,
"page_no": 9,
"cluster": {
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "10"
}
],
"body": [
{
"label": "text",
"id": 15,
"page_no": 9,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 70.0,
"t": 75.9,
"r": 286.4,
"b": 94.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 83.7,
"r_x1": 223.6,
"r_y1": 83.7,
"r_x2": 223.6,
"r_y2": 76.0,
"r_x3": 70.0,
"r_y3": 76.0,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision and Pattern Recognition",
"orig": "Computer Vision and Pattern Recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 223.6,
"r_y0": 83.9,
"r_x1": 286.4,
"r_y1": 83.9,
"r_x2": 286.4,
"r_y2": 75.9,
"r_x3": 223.6,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": ", pages 658-666,",
"orig": ", pages 658-666,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 94.9,
"r_x1": 97.9,
"r_y1": 94.9,
"r_x2": 97.9,
"r_y2": 86.8,
"r_x3": 70.0,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "2019. 6",
"orig": "2019. 6",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"
},
{
"label": "list_item",
"id": 13,
"page_no": 9,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 98.2,
"r": 286.4,
"b": 161.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 106.2,
"r_x1": 65.5,
"r_y1": 106.2,
"r_x2": 65.5,
"r_y2": 98.2,
"r_x3": 50.1,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "[26]",
"orig": "[26]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 106.2,
"r_x1": 286.4,
"r_y1": 106.2,
"r_x2": 286.4,
"r_y2": 98.2,
"r_x3": 67.8,
"r_y3": 98.2,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 117.1,
"r_x1": 286.4,
"r_y1": 117.1,
"r_x2": 286.4,
"r_y2": 109.1,
"r_x3": 70.0,
"r_y3": 109.1,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 128.1,
"r_x1": 286.4,
"r_y1": 128.1,
"r_x2": 286.4,
"r_y2": 120.1,
"r_x3": 70.0,
"r_y3": 120.1,
"coord_origin": "TOPLEFT"
},
"text": "tion and structure recognition of tables in document images.",
"orig": "tion and structure recognition of tables in document images.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 139.1,
"r_x1": 77.5,
"r_y1": 139.1,
"r_x2": 77.5,
"r_y2": 131.0,
"r_x3": 70.0,
"r_y3": 131.0,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 80.6,
"r_y0": 138.9,
"r_x1": 286.4,
"r_y1": 138.9,
"r_x2": 286.4,
"r_y2": 131.1,
"r_x3": 80.6,
"r_y3": 131.1,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR International Conference on Document",
"orig": "2017 14th IAPR International Conference on Document",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 149.8,
"r_x1": 195.2,
"r_y1": 149.8,
"r_x2": 195.2,
"r_y2": 142.1,
"r_x3": 70.0,
"r_y3": 142.1,
"coord_origin": "TOPLEFT"
},
"text": "Analysis and Recognition (ICDAR)",
"orig": "Analysis and Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 195.2,
"r_y0": 150.0,
"r_x1": 286.4,
"r_y1": 150.0,
"r_x2": 286.4,
"r_y2": 142.0,
"r_x3": 195.2,
"r_y3": 142.0,
"coord_origin": "TOPLEFT"
},
"text": ", volume 01, pages 1162-",
"orig": ", volume 01, pages 1162-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 161.0,
"r_x1": 120.3,
"r_y1": 161.0,
"r_x2": 120.3,
"r_y2": 153.0,
"r_x3": 70.0,
"r_y3": 153.0,
"coord_origin": "TOPLEFT"
},
"text": "1167, 2017. 1",
"orig": "1167, 2017. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 1162-1167, 2017. 1"
},
{
"label": "list_item",
"id": 2,
"page_no": 9,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 164.3,
"r": 286.4,
"b": 227.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 172.3,
"r_x1": 65.5,
"r_y1": 172.3,
"r_x2": 65.5,
"r_y2": 164.3,
"r_x3": 50.1,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "[27]",
"orig": "[27]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 172.3,
"r_x1": 286.4,
"r_y1": 172.3,
"r_x2": 286.4,
"r_y2": 164.3,
"r_x3": 67.8,
"r_y3": 164.3,
"coord_origin": "TOPLEFT"
},
"text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 183.3,
"r_x1": 286.4,
"r_y1": 183.3,
"r_x2": 286.4,
"r_y2": 175.2,
"r_x3": 70.0,
"r_y3": 175.2,
"coord_origin": "TOPLEFT"
},
"text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 194.2,
"r_x1": 286.4,
"r_y1": 194.2,
"r_x2": 286.4,
"r_y2": 186.2,
"r_x3": 70.0,
"r_y3": 186.2,
"coord_origin": "TOPLEFT"
},
"text": "tection and structure recognition of tables in document im-",
"orig": "tection and structure recognition of tables in document im-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 205.2,
"r_x1": 101.3,
"r_y1": 205.2,
"r_x2": 101.3,
"r_y2": 197.2,
"r_x3": 70.0,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "ages. In",
"orig": "ages. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 104.3,
"r_y0": 205.0,
"r_x1": 286.4,
"r_y1": 205.0,
"r_x2": 286.4,
"r_y2": 197.2,
"r_x3": 104.3,
"r_y3": 197.2,
"coord_origin": "TOPLEFT"
},
"text": "2017 14th IAPR international conference on doc-",
"orig": "2017 14th IAPR international conference on doc-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 215.9,
"r_x1": 220.5,
"r_y1": 215.9,
"r_x2": 220.5,
"r_y2": 208.2,
"r_x3": 70.0,
"r_y3": 208.2,
"coord_origin": "TOPLEFT"
},
"text": "ument analysis and recognition (ICDAR)",
"orig": "ument analysis and recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.5,
"r_y0": 216.1,
"r_x1": 286.4,
"r_y1": 216.1,
"r_x2": 286.4,
"r_y2": 208.1,
"r_x3": 220.5,
"r_y3": 208.1,
"coord_origin": "TOPLEFT"
},
"text": ", volume 1, pages",
"orig": ", volume 1, pages",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 227.1,
"r_x1": 166.7,
"r_y1": 227.1,
"r_x2": 166.7,
"r_y2": 219.1,
"r_x3": 70.0,
"r_y3": 219.1,
"coord_origin": "TOPLEFT"
},
"text": "1162-1167. IEEE, 2017. 3",
"orig": "1162-1167. IEEE, 2017. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"
},
{
"label": "list_item",
"id": 4,
"page_no": 9,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 230.4,
"r": 286.4,
"b": 271.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 238.4,
"r_x1": 65.7,
"r_y1": 238.4,
"r_x2": 65.7,
"r_y2": 230.4,
"r_x3": 50.1,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "[28]",
"orig": "[28]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 238.4,
"r_x1": 286.4,
"r_y1": 238.4,
"r_x2": 286.4,
"r_y2": 230.4,
"r_x3": 68.0,
"r_y3": 230.4,
"coord_origin": "TOPLEFT"
},
"text": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"orig": "Faisal Shafait and Ray Smith. Table detection in heteroge-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 249.4,
"r_x1": 147.2,
"r_y1": 249.4,
"r_x2": 147.2,
"r_y2": 241.4,
"r_x3": 70.0,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "neous documents. In",
"orig": "neous documents. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 149.9,
"r_y0": 249.2,
"r_x1": 286.4,
"r_y1": 249.2,
"r_x2": 286.4,
"r_y2": 241.4,
"r_x3": 149.9,
"r_y3": 241.4,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the 9th IAPR Interna-",
"orig": "Proceedings of the 9th IAPR Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 260.1,
"r_x1": 244.7,
"r_y1": 260.1,
"r_x2": 244.7,
"r_y2": 252.4,
"r_x3": 70.0,
"r_y3": 252.4,
"coord_origin": "TOPLEFT"
},
"text": "tional Workshop on Document Analysis Systems",
"orig": "tional Workshop on Document Analysis Systems",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 244.7,
"r_y0": 260.3,
"r_x1": 286.4,
"r_y1": 260.3,
"r_x2": 286.4,
"r_y2": 252.3,
"r_x3": 244.7,
"r_y3": 252.3,
"coord_origin": "TOPLEFT"
},
"text": ", pages 65-",
"orig": ", pages 65-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 271.3,
"r_x1": 111.4,
"r_y1": 271.3,
"r_x2": 111.4,
"r_y2": 263.3,
"r_x3": 70.0,
"r_y3": 263.3,
"coord_origin": "TOPLEFT"
},
"text": "72, 2010. 2",
"orig": "72, 2010. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 65-72, 2010. 2"
},
{
"label": "list_item",
"id": 5,
"page_no": 9,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 274.6,
"r": 286.4,
"b": 326.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 282.6,
"r_x1": 66.0,
"r_y1": 282.6,
"r_x2": 66.0,
"r_y2": 274.6,
"r_x3": 50.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "[29]",
"orig": "[29]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 282.6,
"r_x1": 94.9,
"r_y1": 282.6,
"r_x2": 94.9,
"r_y2": 274.6,
"r_x3": 68.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Shoaib",
"orig": "Shoaib",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 100.9,
"r_y0": 282.6,
"r_x1": 127.3,
"r_y1": 282.6,
"r_x2": 127.3,
"r_y2": 274.6,
"r_x3": 100.9,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ahmed",
"orig": "Ahmed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.2,
"r_y0": 282.6,
"r_x1": 165.8,
"r_y1": 282.6,
"r_x2": 165.8,
"r_y2": 274.6,
"r_x3": 133.2,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Siddiqui,",
"orig": "Siddiqui,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 172.7,
"r_y0": 282.6,
"r_x1": 194.1,
"r_y1": 282.6,
"r_x2": 194.1,
"r_y2": 274.6,
"r_x3": 172.7,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Imran",
"orig": "Imran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.0,
"r_y0": 282.6,
"r_x1": 211.5,
"r_y1": 282.6,
"r_x2": 211.5,
"r_y2": 274.6,
"r_x3": 200.0,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Ali",
"orig": "Ali",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.4,
"r_y0": 282.6,
"r_x1": 239.4,
"r_y1": 282.6,
"r_x2": 239.4,
"r_y2": 274.6,
"r_x3": 217.4,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Fateh,",
"orig": "Fateh,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.3,
"r_y0": 282.6,
"r_x1": 264.2,
"r_y1": 282.6,
"r_x2": 264.2,
"r_y2": 274.6,
"r_x3": 246.3,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Syed",
"orig": "Syed",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 270.1,
"r_y0": 282.6,
"r_x1": 286.4,
"r_y1": 282.6,
"r_x2": 286.4,
"r_y2": 274.6,
"r_x3": 270.1,
"r_y3": 274.6,
"coord_origin": "TOPLEFT"
},
"text": "Tah-",
"orig": "Tah-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 293.6,
"r_x1": 286.4,
"r_y1": 293.6,
"r_x2": 286.4,
"r_y2": 285.6,
"r_x3": 70.0,
"r_y3": 285.6,
"coord_origin": "TOPLEFT"
},
"text": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"orig": "seen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 296.5,
"r_x3": 70.0,
"r_y3": 296.5,
"coord_origin": "TOPLEFT"
},
"text": "Deeptabstr: Deep learning based table structure recognition.",
"orig": "Deeptabstr: Deep learning based table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 315.5,
"r_x1": 77.5,
"r_y1": 315.5,
"r_x2": 77.5,
"r_y2": 307.5,
"r_x3": 70.0,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 79.4,
"r_y0": 315.3,
"r_x1": 286.4,
"r_y1": 315.3,
"r_x2": 286.4,
"r_y2": 307.6,
"r_x3": 79.4,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 326.2,
"r_x1": 147.6,
"r_y1": 326.2,
"r_x2": 147.6,
"r_y2": 318.5,
"r_x3": 70.0,
"r_y3": 318.5,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 147.6,
"r_y0": 326.5,
"r_x1": 271.3,
"r_y1": 326.5,
"r_x2": 271.3,
"r_y2": 318.4,
"r_x3": 147.6,
"r_y3": 318.4,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1403-1409. IEEE, 2019. 3",
"orig": ", pages 1403-1409. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 3,
"page_no": 9,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 329.8,
"r": 286.4,
"b": 381.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 337.8,
"r_x1": 65.4,
"r_y1": 337.8,
"r_x2": 65.4,
"r_y2": 329.8,
"r_x3": 50.1,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "[30]",
"orig": "[30]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.7,
"r_y0": 337.8,
"r_x1": 286.4,
"r_y1": 337.8,
"r_x2": 286.4,
"r_y2": 329.8,
"r_x3": 67.7,
"r_y3": 329.8,
"coord_origin": "TOPLEFT"
},
"text": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"orig": "Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 348.7,
"r_x1": 286.4,
"r_y1": 348.7,
"r_x2": 286.4,
"r_y2": 340.7,
"r_x3": 70.0,
"r_y3": 340.7,
"coord_origin": "TOPLEFT"
},
"text": "Bekas. Corpus conversion service: A machine learning plat-",
"orig": "Bekas. Corpus conversion service: A machine learning plat-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 359.7,
"r_x1": 198.8,
"r_y1": 359.7,
"r_x2": 198.8,
"r_y2": 351.7,
"r_x3": 70.0,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "form to ingest documents at scale.",
"orig": "form to ingest documents at scale.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 359.7,
"r_x1": 213.5,
"r_y1": 359.7,
"r_x2": 213.5,
"r_y2": 351.7,
"r_x3": 206.1,
"r_y3": 351.7,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 217.0,
"r_y0": 359.5,
"r_x1": 286.4,
"r_y1": 359.5,
"r_x2": 286.4,
"r_y2": 351.8,
"r_x3": 217.0,
"r_y3": 351.8,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the",
"orig": "Proceedings of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 370.4,
"r_x1": 143.1,
"r_y1": 370.4,
"r_x2": 143.1,
"r_y2": 362.7,
"r_x3": 70.0,
"r_y3": 362.7,
"coord_origin": "TOPLEFT"
},
"text": "24th ACM SIGKDD",
"orig": "24th ACM SIGKDD",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 143.1,
"r_y0": 370.7,
"r_x1": 286.4,
"r_y1": 370.7,
"r_x2": 286.4,
"r_y2": 362.6,
"r_x3": 143.1,
"r_y3": 362.6,
"coord_origin": "TOPLEFT"
},
"text": ", KDD \u201918, pages 774-782, New York,",
"orig": ", KDD \u201918, pages 774-782, New York,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 381.6,
"r_x1": 161.2,
"r_y1": 381.6,
"r_x2": 161.2,
"r_y2": 373.6,
"r_x3": 70.0,
"r_y3": 373.6,
"coord_origin": "TOPLEFT"
},
"text": "NY, USA, 2018. ACM. 1",
"orig": "NY, USA, 2018. ACM. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[30] Peter W J Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"
},
{
"label": "list_item",
"id": 1,
"page_no": 9,
"cluster": {
"id": 1,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 384.9,
"r": 286.4,
"b": 458.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 392.9,
"r_x1": 65.1,
"r_y1": 392.9,
"r_x2": 65.1,
"r_y2": 384.9,
"r_x3": 50.1,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "[31]",
"orig": "[31]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.4,
"r_y0": 392.9,
"r_x1": 286.4,
"r_y1": 392.9,
"r_x2": 286.4,
"r_y2": 384.9,
"r_x3": 67.4,
"r_y3": 384.9,
"coord_origin": "TOPLEFT"
},
"text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 403.9,
"r_x1": 286.4,
"r_y1": 403.9,
"r_x2": 286.4,
"r_y2": 395.9,
"r_x3": 70.0,
"r_y3": 395.9,
"coord_origin": "TOPLEFT"
},
"text": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"orig": "reit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 414.9,
"r_x1": 125.5,
"r_y1": 414.9,
"r_x2": 125.5,
"r_y2": 406.8,
"r_x3": 70.0,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "lia Polosukhin.",
"orig": "lia Polosukhin.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 133.9,
"r_y0": 414.9,
"r_x1": 230.8,
"r_y1": 414.9,
"r_x2": 230.8,
"r_y2": 406.8,
"r_x3": 133.9,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "Attention is all you need.",
"orig": "Attention is all you need.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.3,
"r_y0": 414.9,
"r_x1": 286.4,
"r_y1": 414.9,
"r_x2": 286.4,
"r_y2": 406.8,
"r_x3": 239.3,
"r_y3": 406.8,
"coord_origin": "TOPLEFT"
},
"text": "In I. Guyon,",
"orig": "In I. Guyon,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 425.8,
"r_x1": 79.0,
"r_y1": 425.8,
"r_x2": 79.0,
"r_y2": 417.8,
"r_x3": 70.0,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "U.",
"orig": "U.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 81.3,
"r_y0": 425.8,
"r_x1": 286.4,
"r_y1": 425.8,
"r_x2": 286.4,
"r_y2": 417.8,
"r_x3": 81.3,
"r_y3": 417.8,
"coord_origin": "TOPLEFT"
},
"text": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"orig": "V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 436.8,
"r_x1": 196.8,
"r_y1": 436.8,
"r_x2": 196.8,
"r_y2": 428.8,
"r_x3": 70.0,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "wanathan, and R. Garnett, editors,",
"orig": "wanathan, and R. Garnett, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 200.2,
"r_y0": 436.6,
"r_x1": 286.4,
"r_y1": 436.6,
"r_x2": 286.4,
"r_y2": 428.8,
"r_x3": 200.2,
"r_y3": 428.8,
"coord_origin": "TOPLEFT"
},
"text": "Advances in Neural In-",
"orig": "Advances in Neural In-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 447.5,
"r_x1": 189.2,
"r_y1": 447.5,
"r_x2": 189.2,
"r_y2": 439.8,
"r_x3": 70.0,
"r_y3": 439.8,
"coord_origin": "TOPLEFT"
},
"text": "formation Processing Systems 30",
"orig": "formation Processing Systems 30",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 189.2,
"r_y0": 447.7,
"r_x1": 286.4,
"r_y1": 447.7,
"r_x2": 286.4,
"r_y2": 439.7,
"r_x3": 189.2,
"r_y3": 439.7,
"coord_origin": "TOPLEFT"
},
"text": ", pages 5998-6008. Curran",
"orig": ", pages 5998-6008. Curran",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 458.7,
"r_x1": 158.9,
"r_y1": 458.7,
"r_x2": 158.9,
"r_y2": 450.7,
"r_x3": 70.0,
"r_y3": 450.7,
"coord_origin": "TOPLEFT"
},
"text": "Associates, Inc., 2017. 5",
"orig": "Associates, Inc., 2017. 5",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"
},
{
"label": "list_item",
"id": 6,
"page_no": 9,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 462.0,
"r": 286.4,
"b": 502.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 470.0,
"r_x1": 65.9,
"r_y1": 470.0,
"r_x2": 65.9,
"r_y2": 462.0,
"r_x3": 50.1,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "[32]",
"orig": "[32]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.3,
"r_y0": 470.0,
"r_x1": 286.4,
"r_y1": 470.0,
"r_x2": 286.4,
"r_y2": 462.0,
"r_x3": 68.3,
"r_y3": 462.0,
"coord_origin": "TOPLEFT"
},
"text": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"orig": "Oriol Vinyals, Alexander Toshev, Samy Bengio, and Du-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 481.0,
"r_x1": 116.3,
"r_y1": 481.0,
"r_x2": 116.3,
"r_y2": 473.0,
"r_x3": 70.0,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "mitru Erhan.",
"orig": "mitru Erhan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.5,
"r_y0": 481.0,
"r_x1": 286.4,
"r_y1": 481.0,
"r_x2": 286.4,
"r_y2": 473.0,
"r_x3": 122.5,
"r_y3": 473.0,
"coord_origin": "TOPLEFT"
},
"text": "Show and tell: A neural image caption gen-",
"orig": "Show and tell: A neural image caption gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 491.9,
"r_x1": 103.3,
"r_y1": 491.9,
"r_x2": 103.3,
"r_y2": 483.9,
"r_x3": 70.0,
"r_y3": 483.9,
"coord_origin": "TOPLEFT"
},
"text": "erator. In",
"orig": "erator. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 105.5,
"r_y0": 491.7,
"r_x1": 286.4,
"r_y1": 491.7,
"r_x2": 286.4,
"r_y2": 484.0,
"r_x3": 105.5,
"r_y3": 484.0,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE Conference on Computer",
"orig": "Proceedings of the IEEE Conference on Computer",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 502.7,
"r_x1": 212.5,
"r_y1": 502.7,
"r_x2": 212.5,
"r_y2": 495.0,
"r_x3": 70.0,
"r_y3": 495.0,
"coord_origin": "TOPLEFT"
},
"text": "Vision and Pattern Recognition (CVPR)",
"orig": "Vision and Pattern Recognition (CVPR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 212.5,
"r_y0": 502.9,
"r_x1": 263.6,
"r_y1": 502.9,
"r_x2": 263.6,
"r_y2": 494.9,
"r_x3": 212.5,
"r_y3": 494.9,
"coord_origin": "TOPLEFT"
},
"text": ", June 2015. 2",
"orig": ", June 2015. 2",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"
},
{
"label": "list_item",
"id": 7,
"page_no": 9,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 506.2,
"r": 286.4,
"b": 547.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 514.2,
"r_x1": 65.7,
"r_y1": 514.2,
"r_x2": 65.7,
"r_y2": 506.2,
"r_x3": 50.1,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "[33]",
"orig": "[33]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.0,
"r_y0": 514.2,
"r_x1": 247.4,
"r_y1": 514.2,
"r_x2": 247.4,
"r_y2": 506.2,
"r_x3": 68.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 254.0,
"r_y0": 514.2,
"r_x1": 286.4,
"r_y1": 514.2,
"r_x2": 286.4,
"r_y2": 506.2,
"r_x3": 254.0,
"r_y3": 506.2,
"coord_origin": "TOPLEFT"
},
"text": "Res2tim:",
"orig": "Res2tim:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 525.2,
"r_x1": 265.6,
"r_y1": 525.2,
"r_x2": 265.6,
"r_y2": 517.2,
"r_x3": 70.0,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "reconstruct syntactic structures from table images. In",
"orig": "reconstruct syntactic structures from table images. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 268.4,
"r_y0": 525.0,
"r_x1": 286.4,
"r_y1": 525.0,
"r_x2": 286.4,
"r_y2": 517.2,
"r_x3": 268.4,
"r_y3": 517.2,
"coord_origin": "TOPLEFT"
},
"text": "2019",
"orig": "2019",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 535.9,
"r_x1": 286.4,
"r_y1": 535.9,
"r_x2": 286.4,
"r_y2": 528.2,
"r_x3": 70.0,
"r_y3": 528.2,
"coord_origin": "TOPLEFT"
},
"text": "International Conference on Document Analysis and Recog-",
"orig": "International Conference on Document Analysis and Recog-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 546.9,
"r_x1": 125.3,
"r_y1": 546.9,
"r_x2": 125.3,
"r_y2": 539.2,
"r_x3": 70.0,
"r_y3": 539.2,
"coord_origin": "TOPLEFT"
},
"text": "nition (ICDAR)",
"orig": "nition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.3,
"r_y0": 547.1,
"r_x1": 240.1,
"r_y1": 547.1,
"r_x2": 240.1,
"r_y2": 539.1,
"r_x3": 125.3,
"r_y3": 539.1,
"coord_origin": "TOPLEFT"
},
"text": ", pages 749-755. IEEE, 2019. 3",
"orig": ", pages 749-755. IEEE, 2019. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"
},
{
"label": "list_item",
"id": 11,
"page_no": 9,
"cluster": {
"id": 11,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 550.4,
"r": 286.4,
"b": 591.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.82,
"cells": [
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 558.4,
"r_x1": 66.0,
"r_y1": 558.4,
"r_x2": 66.0,
"r_y2": 550.4,
"r_x3": 50.1,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "[34]",
"orig": "[34]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 68.4,
"r_y0": 558.4,
"r_x1": 286.4,
"r_y1": 558.4,
"r_x2": 286.4,
"r_y2": 550.4,
"r_x3": 68.4,
"r_y3": 550.4,
"coord_origin": "TOPLEFT"
},
"text": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"orig": "Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 569.4,
"r_x1": 137.1,
"r_y1": 569.4,
"r_x2": 137.1,
"r_y2": 561.4,
"r_x3": 70.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "and Qingyong Li.",
"orig": "and Qingyong Li.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 146.0,
"r_y0": 569.4,
"r_x1": 172.4,
"r_y1": 569.4,
"r_x2": 172.4,
"r_y2": 561.4,
"r_x3": 146.0,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "Tgrnet:",
"orig": "Tgrnet:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 178.7,
"r_y0": 569.4,
"r_x1": 286.4,
"r_y1": 569.4,
"r_x2": 286.4,
"r_y2": 561.4,
"r_x3": 178.7,
"r_y3": 561.4,
"coord_origin": "TOPLEFT"
},
"text": "A table graph reconstruction",
"orig": "A table graph reconstruction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 580.3,
"r_x1": 221.0,
"r_y1": 580.3,
"r_x2": 221.0,
"r_y2": 572.3,
"r_x3": 70.0,
"r_y3": 572.3,
"coord_origin": "TOPLEFT"
},
"text": "network for table structure recognition.",
"orig": "network for table structure recognition.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.5,
"r_y0": 580.1,
"r_x1": 286.4,
"r_y1": 580.1,
"r_x2": 286.4,
"r_y2": 572.4,
"r_x3": 232.5,
"r_y3": 572.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv preprint",
"orig": "arXiv preprint",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 591.1,
"r_x1": 135.5,
"r_y1": 591.1,
"r_x2": 135.5,
"r_y2": 583.4,
"r_x3": 70.0,
"r_y3": 583.4,
"coord_origin": "TOPLEFT"
},
"text": "arXiv:2106.10598",
"orig": "arXiv:2106.10598",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 135.5,
"r_y0": 591.3,
"r_x1": 167.9,
"r_y1": 591.3,
"r_x2": 167.9,
"r_y2": 583.3,
"r_x3": 135.5,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 3",
"orig": ", 2021. 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"
},
{
"label": "list_item",
"id": 10,
"page_no": 9,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 594.6,
"r": 286.4,
"b": 635.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 602.6,
"r_x1": 65.2,
"r_y1": 602.6,
"r_x2": 65.2,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "[35]",
"orig": "[35]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 602.6,
"r_x1": 286.4,
"r_y1": 602.6,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 67.5,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 613.6,
"r_x1": 109.1,
"r_y1": 613.6,
"r_x2": 109.1,
"r_y2": 605.6,
"r_x3": 70.0,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Jiebo Luo.",
"orig": "Jiebo Luo.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.2,
"r_y0": 613.6,
"r_x1": 271.8,
"r_y1": 613.6,
"r_x2": 271.8,
"r_y2": 605.6,
"r_x3": 116.2,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "Image captioning with semantic attention.",
"orig": "Image captioning with semantic attention.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 278.9,
"r_y0": 613.6,
"r_x1": 286.4,
"r_y1": 613.6,
"r_x2": 286.4,
"r_y2": 605.6,
"r_x3": 278.9,
"r_y3": 605.6,
"coord_origin": "TOPLEFT"
},
"text": "In",
"orig": "In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 624.3,
"r_x1": 286.4,
"r_y1": 624.3,
"r_x2": 286.4,
"r_y2": 616.6,
"r_x3": 70.0,
"r_y3": 616.6,
"coord_origin": "TOPLEFT"
},
"text": "Proceedings of the IEEE conference on computer vision and",
"orig": "Proceedings of the IEEE conference on computer vision and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 635.3,
"r_x1": 139.1,
"r_y1": 635.3,
"r_x2": 139.1,
"r_y2": 627.6,
"r_x3": 70.0,
"r_y3": 627.6,
"coord_origin": "TOPLEFT"
},
"text": "pattern recognition",
"orig": "pattern recognition",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 139.1,
"r_y0": 635.5,
"r_x1": 239.0,
"r_y1": 635.5,
"r_x2": 239.0,
"r_y2": 627.5,
"r_x3": 139.1,
"r_y3": 627.5,
"coord_origin": "TOPLEFT"
},
"text": ", pages 4651-4659, 2016. 4",
"orig": ", pages 4651-4659, 2016. 4",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"
},
{
"label": "list_item",
"id": 12,
"page_no": 9,
"cluster": {
"id": 12,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 638.8,
"r": 286.4,
"b": 690.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 646.8,
"r_x1": 65.2,
"r_y1": 646.8,
"r_x2": 65.2,
"r_y2": 638.8,
"r_x3": 50.1,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "[36]",
"orig": "[36]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.5,
"r_y0": 646.8,
"r_x1": 286.4,
"r_y1": 646.8,
"r_x2": 286.4,
"r_y2": 638.8,
"r_x3": 67.5,
"r_y3": 638.8,
"coord_origin": "TOPLEFT"
},
"text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 657.8,
"r_x1": 286.4,
"r_y1": 657.8,
"r_x2": 286.4,
"r_y2": 649.8,
"r_x3": 70.0,
"r_y3": 649.8,
"coord_origin": "TOPLEFT"
},
"text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 668.7,
"r_x1": 286.4,
"r_y1": 668.7,
"r_x2": 286.4,
"r_y2": 660.7,
"r_x3": 70.0,
"r_y3": 660.7,
"coord_origin": "TOPLEFT"
},
"text": "work for joint table identification and cell structure recogni-",
"orig": "work for joint table identification and cell structure recogni-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 679.7,
"r_x1": 158.5,
"r_y1": 679.7,
"r_x2": 158.5,
"r_y2": 671.7,
"r_x3": 70.0,
"r_y3": 671.7,
"coord_origin": "TOPLEFT"
},
"text": "tion using visual context.",
"orig": "tion using visual context.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.5,
"r_y0": 679.5,
"r_x1": 286.4,
"r_y1": 679.5,
"r_x2": 286.4,
"r_y2": 671.8,
"r_x3": 160.5,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Winter Conference for Applications",
"orig": "Winter Conference for Applications",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 690.4,
"r_x1": 171.4,
"r_y1": 690.4,
"r_x2": 171.4,
"r_y2": 682.7,
"r_x3": 70.0,
"r_y3": 682.7,
"coord_origin": "TOPLEFT"
},
"text": "in Computer Vision (WACV)",
"orig": "in Computer Vision (WACV)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 171.4,
"r_y0": 690.7,
"r_x1": 212.8,
"r_y1": 690.7,
"r_x2": 212.8,
"r_y2": 682.6,
"r_x3": 171.4,
"r_y3": 682.6,
"coord_origin": "TOPLEFT"
},
"text": ", 2021. 2, 3",
"orig": ", 2021. 2, 3",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"
},
{
"label": "list_item",
"id": 8,
"page_no": 9,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 694.0,
"r": 286.4,
"b": 712.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.0,
"r_x1": 66.5,
"r_y1": 702.0,
"r_x2": 66.5,
"r_y2": 694.0,
"r_x3": 50.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "[37]",
"orig": "[37]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 69.0,
"r_y0": 702.0,
"r_x1": 81.0,
"r_y1": 702.0,
"r_x2": 81.0,
"r_y2": 694.0,
"r_x3": 69.0,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Xu",
"orig": "Xu",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 89.1,
"r_y0": 702.0,
"r_x1": 114.7,
"r_y1": 702.0,
"r_x2": 114.7,
"r_y2": 694.0,
"r_x3": 89.1,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Zhong,",
"orig": "Zhong,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 124.2,
"r_y0": 702.0,
"r_x1": 149.1,
"r_y1": 702.0,
"r_x2": 149.1,
"r_y2": 694.0,
"r_x3": 124.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Elaheh",
"orig": "Elaheh",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 157.2,
"r_y0": 702.0,
"r_x1": 209.4,
"r_y1": 702.0,
"r_x2": 209.4,
"r_y2": 694.0,
"r_x3": 157.2,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "ShafieiBavani,",
"orig": "ShafieiBavani,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 218.9,
"r_y0": 702.0,
"r_x1": 231.9,
"r_y1": 702.0,
"r_x2": 231.9,
"r_y2": 694.0,
"r_x3": 218.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 239.9,
"r_y0": 702.0,
"r_x1": 269.3,
"r_y1": 702.0,
"r_x2": 269.3,
"r_y2": 694.0,
"r_x3": 239.9,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Antonio",
"orig": "Antonio",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 277.4,
"r_y0": 702.0,
"r_x1": 286.4,
"r_y1": 702.0,
"r_x2": 286.4,
"r_y2": 694.0,
"r_x3": 277.4,
"r_y3": 694.0,
"coord_origin": "TOPLEFT"
},
"text": "Ji-",
"orig": "Ji-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 712.9,
"r_x1": 286.4,
"r_y1": 712.9,
"r_x2": 286.4,
"r_y2": 704.9,
"r_x3": 70.0,
"r_y3": 704.9,
"coord_origin": "TOPLEFT"
},
"text": "meno Yepes. Image-based table recognition: Data, model,",
"orig": "meno Yepes. Image-based table recognition: Data, model,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"
},
{
"label": "list_item",
"id": 14,
"page_no": 9,
"cluster": {
"id": 14,
"label": "list_item",
"bbox": {
"l": 328.8,
"t": 75.9,
"r": 545.1,
"b": 116.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 83.9,
"r_x1": 545.1,
"r_y1": 83.9,
"r_x2": 545.1,
"r_y2": 75.9,
"r_x3": 328.8,
"r_y3": 75.9,
"coord_origin": "TOPLEFT"
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"orig": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 94.9,
"r_x1": 472.3,
"r_y1": 94.9,
"r_x2": 472.3,
"r_y2": 86.8,
"r_x3": 328.8,
"r_y3": 86.8,
"coord_origin": "TOPLEFT"
},
"text": "Brox, and Jan-Michael Frahm, editors,",
"orig": "Brox, and Jan-Michael Frahm, editors,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 475.9,
"r_y0": 94.7,
"r_x1": 545.1,
"r_y1": 94.7,
"r_x2": 545.1,
"r_y2": 86.9,
"r_x3": 475.9,
"r_y3": 86.9,
"coord_origin": "TOPLEFT"
},
"text": "Computer Vision -",
"orig": "Computer Vision -",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 105.6,
"r_x1": 371.9,
"r_y1": 105.6,
"r_x2": 371.9,
"r_y2": 97.9,
"r_x3": 328.8,
"r_y3": 97.9,
"coord_origin": "TOPLEFT"
},
"text": "ECCV 2020",
"orig": "ECCV 2020",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 371.9,
"r_y0": 105.8,
"r_x1": 545.1,
"r_y1": 105.8,
"r_x2": 545.1,
"r_y2": 97.8,
"r_x3": 371.9,
"r_y3": 97.8,
"coord_origin": "TOPLEFT"
},
"text": ", pages 564-580, Cham, 2020. Springer Interna-",
"orig": ", pages 564-580, Cham, 2020. Springer Interna-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 116.8,
"r_x1": 417.7,
"r_y1": 116.8,
"r_x2": 417.7,
"r_y2": 108.8,
"r_x3": 328.8,
"r_y3": 108.8,
"coord_origin": "TOPLEFT"
},
"text": "tional Publishing. 2, 3, 7",
"orig": "tional Publishing. 2, 3, 7",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"
},
{
"label": "list_item",
"id": 9,
"page_no": 9,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 120.7,
"r": 545.1,
"b": 161.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 128.7,
"r_x1": 324.3,
"r_y1": 128.7,
"r_x2": 324.3,
"r_y2": 120.7,
"r_x3": 308.9,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "[38]",
"orig": "[38]",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.7,
"r_y0": 128.7,
"r_x1": 545.1,
"r_y1": 128.7,
"r_x2": 545.1,
"r_y2": 120.7,
"r_x3": 326.7,
"r_y3": 120.7,
"coord_origin": "TOPLEFT"
},
"text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Pub-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 139.7,
"r_x1": 545.1,
"r_y1": 139.7,
"r_x2": 545.1,
"r_y2": 131.7,
"r_x3": 328.8,
"r_y3": 131.7,
"coord_origin": "TOPLEFT"
},
"text": "laynet: Largest dataset ever for document layout analysis. In",
"orig": "laynet: Largest dataset ever for document layout analysis. In",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 150.4,
"r_x1": 545.1,
"r_y1": 150.4,
"r_x2": 545.1,
"r_y2": 142.7,
"r_x3": 328.8,
"r_y3": 142.7,
"coord_origin": "TOPLEFT"
},
"text": "2019 International Conference on Document Analysis and",
"orig": "2019 International Conference on Document Analysis and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 328.8,
"r_y0": 161.4,
"r_x1": 406.3,
"r_y1": 161.4,
"r_x2": 406.3,
"r_y2": 153.7,
"r_x3": 328.8,
"r_y3": 153.7,
"coord_origin": "TOPLEFT"
},
"text": "Recognition (ICDAR)",
"orig": "Recognition (ICDAR)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 406.3,
"r_y0": 161.6,
"r_x1": 506.2,
"r_y1": 161.6,
"r_x2": 506.2,
"r_y2": 153.6,
"r_x3": 406.3,
"r_y3": 153.6,
"coord_origin": "TOPLEFT"
},
"text": ", pages 1015-1022, 2019. 1",
"orig": ", pages 1015-1022, 2019. 1",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"
}
],
"headers": [
{
"label": "page_footer",
"id": 0,
"page_no": 9,
"cluster": {
"id": 0,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "10",
"orig": "10",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "10"
}
]
}
},
{
"page_no": 10,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.8,
"r_y0": 121.3,
"r_x1": 465.4,
"r_y1": 121.3,
"r_x2": 465.4,
"r_y2": 110.6,
"r_x3": 132.8,
"r_y3": 110.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.2,
"r_y0": 135.5,
"r_x1": 375.0,
"r_y1": 135.5,
"r_x2": 375.0,
"r_y2": 122.3,
"r_x3": 220.2,
"r_y3": 122.3,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 171.9,
"r_x1": 57.1,
"r_y1": 171.9,
"r_x2": 57.1,
"r_y2": 161.2,
"r_x3": 50.1,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 171.9,
"r_x1": 176.0,
"r_y1": 171.9,
"r_x2": 176.0,
"r_y2": 161.2,
"r_x3": 66.4,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 190.8,
"r_x1": 64.2,
"r_y1": 190.8,
"r_x2": 64.2,
"r_y2": 181.0,
"r_x3": 50.1,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.6,
"r_y0": 190.8,
"r_x1": 150.4,
"r_y1": 190.8,
"r_x2": 150.4,
"r_y2": 181.0,
"r_x3": 73.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 208.8,
"r_x1": 286.4,
"r_y1": 208.8,
"r_x2": 286.4,
"r_y2": 199.9,
"r_x3": 62.1,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 220.8,
"r_x1": 286.4,
"r_y1": 220.8,
"r_x2": 286.4,
"r_y2": 211.9,
"r_x3": 50.1,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 232.7,
"r_x1": 286.4,
"r_y1": 232.7,
"r_x2": 286.4,
"r_y2": 223.8,
"r_x3": 50.1,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 244.7,
"r_x1": 286.4,
"r_y1": 244.7,
"r_x2": 286.4,
"r_y2": 235.8,
"r_x3": 50.1,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 256.6,
"r_x1": 286.4,
"r_y1": 256.6,
"r_x2": 286.4,
"r_y2": 247.7,
"r_x3": 50.1,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 268.6,
"r_x1": 286.4,
"r_y1": 268.6,
"r_x2": 286.4,
"r_y2": 259.7,
"r_x3": 50.1,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 280.6,
"r_x1": 286.4,
"r_y1": 280.6,
"r_x2": 286.4,
"r_y2": 271.7,
"r_x3": 50.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 292.5,
"r_x1": 286.4,
"r_y1": 292.5,
"r_x2": 286.4,
"r_y2": 283.6,
"r_x3": 50.1,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 295.6,
"r_x3": 50.1,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 316.4,
"r_x1": 286.4,
"r_y1": 316.4,
"r_x2": 286.4,
"r_y2": 307.5,
"r_x3": 50.1,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 328.4,
"r_x1": 286.4,
"r_y1": 328.4,
"r_x2": 286.4,
"r_y2": 319.5,
"r_x3": 50.1,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 340.3,
"r_x1": 286.4,
"r_y1": 340.3,
"r_x2": 286.4,
"r_y2": 331.4,
"r_x3": 50.1,
"r_y3": 331.4,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 352.3,
"r_x1": 286.4,
"r_y1": 352.3,
"r_x2": 286.4,
"r_y2": 343.4,
"r_x3": 50.1,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 364.2,
"r_x1": 286.4,
"r_y1": 364.2,
"r_x2": 286.4,
"r_y2": 355.3,
"r_x3": 50.1,
"r_y3": 355.3,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 376.2,
"r_x1": 286.4,
"r_y1": 376.2,
"r_x2": 286.4,
"r_y2": 367.3,
"r_x3": 50.1,
"r_y3": 367.3,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 388.2,
"r_x1": 230.8,
"r_y1": 388.2,
"r_x2": 230.8,
"r_y2": 379.2,
"r_x3": 50.1,
"r_y3": 379.2,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 400.3,
"r_x1": 286.4,
"r_y1": 400.3,
"r_x2": 286.4,
"r_y2": 391.4,
"r_x3": 62.1,
"r_y3": 391.4,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 412.3,
"r_x1": 286.4,
"r_y1": 412.3,
"r_x2": 286.4,
"r_y2": 403.4,
"r_x3": 50.1,
"r_y3": 403.4,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 424.2,
"r_x1": 286.4,
"r_y1": 424.2,
"r_x2": 286.4,
"r_y2": 415.3,
"r_x3": 50.1,
"r_y3": 415.3,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 436.2,
"r_x1": 286.4,
"r_y1": 436.2,
"r_x2": 286.4,
"r_y2": 427.3,
"r_x3": 50.1,
"r_y3": 427.3,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.1,
"r_x1": 286.4,
"r_y1": 448.1,
"r_x2": 286.4,
"r_y2": 439.2,
"r_x3": 50.1,
"r_y3": 439.2,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.1,
"r_x1": 286.4,
"r_y1": 460.1,
"r_x2": 286.4,
"r_y2": 451.2,
"r_x3": 50.1,
"r_y3": 451.2,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.0,
"r_x1": 286.4,
"r_y1": 472.0,
"r_x2": 286.4,
"r_y2": 463.1,
"r_x3": 50.1,
"r_y3": 463.1,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.0,
"r_x1": 286.4,
"r_y1": 484.0,
"r_x2": 286.4,
"r_y2": 475.1,
"r_x3": 50.1,
"r_y3": 475.1,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.0,
"r_x1": 286.4,
"r_y1": 496.0,
"r_x2": 286.4,
"r_y2": 487.0,
"r_x3": 50.1,
"r_y3": 487.0,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 507.9,
"r_x1": 286.4,
"r_y1": 507.9,
"r_x2": 286.4,
"r_y2": 499.0,
"r_x3": 50.1,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 519.9,
"r_x1": 286.4,
"r_y1": 519.9,
"r_x2": 286.4,
"r_y2": 511.0,
"r_x3": 50.1,
"r_y3": 511.0,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 531.8,
"r_x1": 286.4,
"r_y1": 531.8,
"r_x2": 286.4,
"r_y2": 522.9,
"r_x3": 50.1,
"r_y3": 522.9,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.8,
"r_x1": 286.4,
"r_y1": 543.8,
"r_x2": 286.4,
"r_y2": 534.9,
"r_x3": 50.1,
"r_y3": 534.9,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.7,
"r_x1": 286.4,
"r_y1": 555.7,
"r_x2": 286.4,
"r_y2": 546.8,
"r_x3": 50.1,
"r_y3": 546.8,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.7,
"r_x1": 257.5,
"r_y1": 567.7,
"r_x2": 257.5,
"r_y2": 558.8,
"r_x3": 50.1,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.9,
"r_y0": 567.7,
"r_x1": 286.4,
"r_y1": 567.7,
"r_x2": 286.4,
"r_y2": 558.8,
"r_x3": 263.9,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.6,
"r_x1": 286.4,
"r_y1": 579.6,
"r_x2": 286.4,
"r_y2": 570.7,
"r_x3": 50.1,
"r_y3": 570.7,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.6,
"r_x1": 286.4,
"r_y1": 591.6,
"r_x2": 286.4,
"r_y2": 582.7,
"r_x3": 50.1,
"r_y3": 582.7,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.5,
"r_x1": 286.4,
"r_y1": 603.5,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.5,
"r_x1": 286.4,
"r_y1": 615.5,
"r_x2": 286.4,
"r_y2": 606.6,
"r_x3": 50.1,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.5,
"r_x1": 242.3,
"r_y1": 627.5,
"r_x2": 242.3,
"r_y2": 618.6,
"r_x3": 50.1,
"r_y3": 618.6,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 639.6,
"r_x1": 286.4,
"r_y1": 639.6,
"r_x2": 286.4,
"r_y2": 630.7,
"r_x3": 62.1,
"r_y3": 630.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 651.6,
"r_x1": 179.9,
"r_y1": 651.6,
"r_x2": 179.9,
"r_y2": 642.7,
"r_x3": 50.1,
"r_y3": 642.7,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 672.2,
"r_x1": 64.3,
"r_y1": 672.2,
"r_x2": 64.3,
"r_y2": 662.4,
"r_x3": 50.1,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 672.2,
"r_x1": 153.6,
"r_y1": 672.2,
"r_x2": 153.6,
"r_y2": 662.4,
"r_x3": 73.8,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 690.2,
"r_x1": 286.4,
"r_y1": 690.2,
"r_x2": 286.4,
"r_y2": 681.3,
"r_x3": 62.1,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.2,
"r_x1": 286.4,
"r_y1": 702.2,
"r_x2": 286.4,
"r_y2": 693.3,
"r_x3": 50.1,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 714.1,
"r_x1": 84.1,
"r_y1": 714.1,
"r_x2": 84.1,
"r_y2": 705.2,
"r_x3": 50.1,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.2,
"r_y0": 714.1,
"r_x1": 286.4,
"r_y1": 714.1,
"r_x2": 286.4,
"r_y2": 705.2,
"r_x3": 91.2,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 171.6,
"r_x1": 545.1,
"r_y1": 171.6,
"r_x2": 545.1,
"r_y2": 162.7,
"r_x3": 308.9,
"r_y3": 162.7,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 174.6,
"r_x3": 308.9,
"r_y3": 174.6,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 195.5,
"r_x1": 545.1,
"r_y1": 195.5,
"r_x2": 545.1,
"r_y2": 186.6,
"r_x3": 308.9,
"r_y3": 186.6,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 207.4,
"r_x1": 484.1,
"r_y1": 207.4,
"r_x2": 484.1,
"r_y2": 198.5,
"r_x3": 308.9,
"r_y3": 198.5,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 220.1,
"r_x1": 545.1,
"r_y1": 220.1,
"r_x2": 545.1,
"r_y2": 211.2,
"r_x3": 320.8,
"r_y3": 211.2,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.1,
"r_x1": 448.1,
"r_y1": 232.1,
"r_x2": 448.1,
"r_y2": 223.2,
"r_x3": 308.9,
"r_y3": 223.2,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 244.8,
"r_x1": 328.3,
"r_y1": 244.8,
"r_x2": 328.3,
"r_y2": 235.9,
"r_x3": 320.8,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 244.8,
"r_x1": 545.1,
"r_y1": 244.8,
"r_x2": 545.1,
"r_y2": 235.9,
"r_x3": 335.4,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.8,
"r_x1": 545.1,
"r_y1": 256.8,
"r_x2": 545.1,
"r_y2": 247.9,
"r_x3": 308.9,
"r_y3": 247.9,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.7,
"r_x1": 545.1,
"r_y1": 268.7,
"r_x2": 545.1,
"r_y2": 259.8,
"r_x3": 308.9,
"r_y3": 259.8,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.7,
"r_x1": 393.4,
"r_y1": 280.7,
"r_x2": 393.4,
"r_y2": 271.8,
"r_x3": 308.9,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.1,
"r_y0": 280.7,
"r_x1": 545.1,
"r_y1": 280.7,
"r_x2": 545.1,
"r_y2": 271.8,
"r_x3": 400.1,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.6,
"r_x1": 545.1,
"r_y1": 292.6,
"r_x2": 545.1,
"r_y2": 283.7,
"r_x3": 308.9,
"r_y3": 283.7,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.6,
"r_x1": 545.1,
"r_y1": 304.6,
"r_x2": 545.1,
"r_y2": 295.7,
"r_x3": 308.9,
"r_y3": 295.7,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.5,
"r_x1": 425.7,
"r_y1": 316.5,
"r_x2": 425.7,
"r_y2": 307.6,
"r_x3": 308.9,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 329.3,
"r_x1": 328.5,
"r_y1": 329.3,
"r_x2": 328.5,
"r_y2": 320.4,
"r_x3": 320.8,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 329.3,
"r_x1": 545.1,
"r_y1": 329.3,
"r_x2": 545.1,
"r_y2": 320.4,
"r_x3": 331.1,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 341.2,
"r_x1": 545.1,
"r_y1": 341.2,
"r_x2": 545.1,
"r_y2": 332.3,
"r_x3": 308.9,
"r_y3": 332.3,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 353.2,
"r_x1": 545.1,
"r_y1": 353.2,
"r_x2": 545.1,
"r_y2": 344.3,
"r_x3": 308.9,
"r_y3": 344.3,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 365.1,
"r_x1": 545.1,
"r_y1": 365.1,
"r_x2": 545.1,
"r_y2": 356.2,
"r_x3": 308.9,
"r_y3": 356.2,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 377.1,
"r_x1": 545.1,
"r_y1": 377.1,
"r_x2": 545.1,
"r_y2": 368.2,
"r_x3": 308.9,
"r_y3": 368.2,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 389.0,
"r_x1": 545.1,
"r_y1": 389.0,
"r_x2": 545.1,
"r_y2": 380.1,
"r_x3": 308.9,
"r_y3": 380.1,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 401.0,
"r_x1": 545.1,
"r_y1": 401.0,
"r_x2": 545.1,
"r_y2": 392.1,
"r_x3": 308.9,
"r_y3": 392.1,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.9,
"r_x1": 545.1,
"r_y1": 412.9,
"r_x2": 545.1,
"r_y2": 404.0,
"r_x3": 308.9,
"r_y3": 404.0,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.9,
"r_x1": 545.1,
"r_y1": 424.9,
"r_x2": 545.1,
"r_y2": 416.0,
"r_x3": 308.9,
"r_y3": 416.0,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.9,
"r_x1": 545.1,
"r_y1": 436.9,
"r_x2": 545.1,
"r_y2": 427.9,
"r_x3": 308.9,
"r_y3": 427.9,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.8,
"r_x1": 345.9,
"r_y1": 448.8,
"r_x2": 345.9,
"r_y2": 439.9,
"r_x3": 308.9,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 461.5,
"r_x1": 328.3,
"r_y1": 461.5,
"r_x2": 328.3,
"r_y2": 452.6,
"r_x3": 320.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.5,
"r_x1": 485.8,
"r_y1": 461.5,
"r_x2": 485.8,
"r_y2": 452.6,
"r_x3": 330.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.1,
"r_y0": 461.3,
"r_x1": 511.9,
"r_y1": 461.3,
"r_x2": 511.9,
"r_y2": 452.7,
"r_x3": 488.1,
"r_y3": 452.7,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.9,
"r_y0": 461.5,
"r_x1": 545.1,
"r_y1": 461.5,
"r_x2": 545.1,
"r_y2": 452.6,
"r_x3": 511.9,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 473.5,
"r_x1": 545.1,
"r_y1": 473.5,
"r_x2": 545.1,
"r_y2": 464.6,
"r_x3": 308.9,
"r_y3": 464.6,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 485.4,
"r_x1": 545.1,
"r_y1": 485.4,
"r_x2": 545.1,
"r_y2": 476.5,
"r_x3": 308.9,
"r_y3": 476.5,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.4,
"r_x1": 379.1,
"r_y1": 497.4,
"r_x2": 379.1,
"r_y2": 488.5,
"r_x3": 308.9,
"r_y3": 488.5,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 510.1,
"r_x1": 328.7,
"r_y1": 510.1,
"r_x2": 328.7,
"r_y2": 501.2,
"r_x3": 320.8,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 510.1,
"r_x1": 545.1,
"r_y1": 510.1,
"r_x2": 545.1,
"r_y2": 501.2,
"r_x3": 331.3,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 522.1,
"r_x1": 545.1,
"r_y1": 522.1,
"r_x2": 545.1,
"r_y2": 513.2,
"r_x3": 308.9,
"r_y3": 513.2,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 534.0,
"r_x1": 384.3,
"r_y1": 534.0,
"r_x2": 384.3,
"r_y2": 525.1,
"r_x3": 308.9,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.3,
"r_y0": 534.0,
"r_x1": 545.1,
"r_y1": 534.0,
"r_x2": 545.1,
"r_y2": 525.1,
"r_x3": 391.3,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 546.0,
"r_x1": 496.2,
"r_y1": 546.0,
"r_x2": 496.2,
"r_y2": 537.1,
"r_x3": 308.9,
"r_y3": 537.1,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 558.7,
"r_x1": 328.3,
"r_y1": 558.7,
"r_x2": 328.3,
"r_y2": 549.8,
"r_x3": 320.8,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.7,
"r_x1": 545.1,
"r_y1": 558.7,
"r_x2": 545.1,
"r_y2": 549.8,
"r_x3": 335.4,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 570.6,
"r_x1": 545.1,
"r_y1": 570.6,
"r_x2": 545.1,
"r_y2": 561.7,
"r_x3": 308.9,
"r_y3": 561.7,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 582.6,
"r_x1": 545.1,
"r_y1": 582.6,
"r_x2": 545.1,
"r_y2": 573.7,
"r_x3": 308.9,
"r_y3": 573.7,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 594.5,
"r_x1": 545.1,
"r_y1": 594.5,
"r_x2": 545.1,
"r_y2": 585.6,
"r_x3": 308.9,
"r_y3": 585.6,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 606.5,
"r_x1": 341.2,
"r_y1": 606.5,
"r_x2": 341.2,
"r_y2": 597.6,
"r_x3": 308.9,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 633.0,
"r_x1": 316.8,
"r_y1": 633.0,
"r_x2": 316.8,
"r_y2": 622.3,
"r_x3": 308.9,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.3,
"r_y0": 633.0,
"r_x1": 545.1,
"r_y1": 633.0,
"r_x2": 545.1,
"r_y2": 622.3,
"r_x3": 327.3,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 647.0,
"r_x1": 357.3,
"r_y1": 647.0,
"r_x2": 357.3,
"r_y2": 636.2,
"r_x3": 326.8,
"r_y3": 636.2,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 666.3,
"r_x1": 545.1,
"r_y1": 666.3,
"r_x2": 545.1,
"r_y2": 657.4,
"r_x3": 320.8,
"r_y3": 657.4,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 678.3,
"r_x1": 545.1,
"r_y1": 678.3,
"r_x2": 545.1,
"r_y2": 669.4,
"r_x3": 308.9,
"r_y3": 669.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 690.2,
"r_x1": 545.1,
"r_y1": 690.2,
"r_x2": 545.1,
"r_y2": 681.3,
"r_x3": 308.9,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 702.2,
"r_x1": 545.1,
"r_y1": 702.2,
"r_x2": 545.1,
"r_y2": 693.3,
"r_x3": 308.9,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 714.1,
"r_x1": 371.4,
"r_y1": 714.1,
"r_x2": 371.4,
"r_y2": 705.2,
"r_x3": 308.9,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.8,
"t": 110.6,
"r": 465.4,
"b": 135.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.8,
"r_y0": 121.3,
"r_x1": 465.4,
"r_y1": 121.3,
"r_x2": 465.4,
"r_y2": 110.6,
"r_x3": 132.8,
"r_y3": 110.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.2,
"r_y0": 135.5,
"r_x1": 375.0,
"r_y1": 135.5,
"r_x2": 375.0,
"r_y2": 122.3,
"r_x3": 220.2,
"r_y3": 122.3,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 161.2,
"r": 176.0,
"b": 171.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 171.9,
"r_x1": 57.1,
"r_y1": 171.9,
"r_x2": 57.1,
"r_y2": 161.2,
"r_x3": 50.1,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 171.9,
"r_x1": 176.0,
"r_y1": 171.9,
"r_x2": 176.0,
"r_y2": 161.2,
"r_x3": 66.4,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 150.4,
"b": 190.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 190.8,
"r_x1": 64.2,
"r_y1": 190.8,
"r_x2": 64.2,
"r_y2": 181.0,
"r_x3": 50.1,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.6,
"r_y0": 190.8,
"r_x1": 150.4,
"r_y1": 190.8,
"r_x2": 150.4,
"r_y2": 181.0,
"r_x3": 73.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 199.9,
"r": 286.4,
"b": 388.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 208.8,
"r_x1": 286.4,
"r_y1": 208.8,
"r_x2": 286.4,
"r_y2": 199.9,
"r_x3": 62.1,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 220.8,
"r_x1": 286.4,
"r_y1": 220.8,
"r_x2": 286.4,
"r_y2": 211.9,
"r_x3": 50.1,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 232.7,
"r_x1": 286.4,
"r_y1": 232.7,
"r_x2": 286.4,
"r_y2": 223.8,
"r_x3": 50.1,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 244.7,
"r_x1": 286.4,
"r_y1": 244.7,
"r_x2": 286.4,
"r_y2": 235.8,
"r_x3": 50.1,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 256.6,
"r_x1": 286.4,
"r_y1": 256.6,
"r_x2": 286.4,
"r_y2": 247.7,
"r_x3": 50.1,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 268.6,
"r_x1": 286.4,
"r_y1": 268.6,
"r_x2": 286.4,
"r_y2": 259.7,
"r_x3": 50.1,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 280.6,
"r_x1": 286.4,
"r_y1": 280.6,
"r_x2": 286.4,
"r_y2": 271.7,
"r_x3": 50.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 292.5,
"r_x1": 286.4,
"r_y1": 292.5,
"r_x2": 286.4,
"r_y2": 283.6,
"r_x3": 50.1,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 295.6,
"r_x3": 50.1,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 316.4,
"r_x1": 286.4,
"r_y1": 316.4,
"r_x2": 286.4,
"r_y2": 307.5,
"r_x3": 50.1,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 328.4,
"r_x1": 286.4,
"r_y1": 328.4,
"r_x2": 286.4,
"r_y2": 319.5,
"r_x3": 50.1,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 340.3,
"r_x1": 286.4,
"r_y1": 340.3,
"r_x2": 286.4,
"r_y2": 331.4,
"r_x3": 50.1,
"r_y3": 331.4,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 352.3,
"r_x1": 286.4,
"r_y1": 352.3,
"r_x2": 286.4,
"r_y2": 343.4,
"r_x3": 50.1,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 364.2,
"r_x1": 286.4,
"r_y1": 364.2,
"r_x2": 286.4,
"r_y2": 355.3,
"r_x3": 50.1,
"r_y3": 355.3,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 376.2,
"r_x1": 286.4,
"r_y1": 376.2,
"r_x2": 286.4,
"r_y2": 367.3,
"r_x3": 50.1,
"r_y3": 367.3,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 388.2,
"r_x1": 230.8,
"r_y1": 388.2,
"r_x2": 230.8,
"r_y2": 379.2,
"r_x3": 50.1,
"r_y3": 379.2,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 391.4,
"r": 286.4,
"b": 627.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 400.3,
"r_x1": 286.4,
"r_y1": 400.3,
"r_x2": 286.4,
"r_y2": 391.4,
"r_x3": 62.1,
"r_y3": 391.4,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 412.3,
"r_x1": 286.4,
"r_y1": 412.3,
"r_x2": 286.4,
"r_y2": 403.4,
"r_x3": 50.1,
"r_y3": 403.4,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 424.2,
"r_x1": 286.4,
"r_y1": 424.2,
"r_x2": 286.4,
"r_y2": 415.3,
"r_x3": 50.1,
"r_y3": 415.3,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 436.2,
"r_x1": 286.4,
"r_y1": 436.2,
"r_x2": 286.4,
"r_y2": 427.3,
"r_x3": 50.1,
"r_y3": 427.3,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.1,
"r_x1": 286.4,
"r_y1": 448.1,
"r_x2": 286.4,
"r_y2": 439.2,
"r_x3": 50.1,
"r_y3": 439.2,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.1,
"r_x1": 286.4,
"r_y1": 460.1,
"r_x2": 286.4,
"r_y2": 451.2,
"r_x3": 50.1,
"r_y3": 451.2,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.0,
"r_x1": 286.4,
"r_y1": 472.0,
"r_x2": 286.4,
"r_y2": 463.1,
"r_x3": 50.1,
"r_y3": 463.1,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.0,
"r_x1": 286.4,
"r_y1": 484.0,
"r_x2": 286.4,
"r_y2": 475.1,
"r_x3": 50.1,
"r_y3": 475.1,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.0,
"r_x1": 286.4,
"r_y1": 496.0,
"r_x2": 286.4,
"r_y2": 487.0,
"r_x3": 50.1,
"r_y3": 487.0,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 507.9,
"r_x1": 286.4,
"r_y1": 507.9,
"r_x2": 286.4,
"r_y2": 499.0,
"r_x3": 50.1,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 519.9,
"r_x1": 286.4,
"r_y1": 519.9,
"r_x2": 286.4,
"r_y2": 511.0,
"r_x3": 50.1,
"r_y3": 511.0,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 531.8,
"r_x1": 286.4,
"r_y1": 531.8,
"r_x2": 286.4,
"r_y2": 522.9,
"r_x3": 50.1,
"r_y3": 522.9,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.8,
"r_x1": 286.4,
"r_y1": 543.8,
"r_x2": 286.4,
"r_y2": 534.9,
"r_x3": 50.1,
"r_y3": 534.9,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.7,
"r_x1": 286.4,
"r_y1": 555.7,
"r_x2": 286.4,
"r_y2": 546.8,
"r_x3": 50.1,
"r_y3": 546.8,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.7,
"r_x1": 257.5,
"r_y1": 567.7,
"r_x2": 257.5,
"r_y2": 558.8,
"r_x3": 50.1,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.9,
"r_y0": 567.7,
"r_x1": 286.4,
"r_y1": 567.7,
"r_x2": 286.4,
"r_y2": 558.8,
"r_x3": 263.9,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.6,
"r_x1": 286.4,
"r_y1": 579.6,
"r_x2": 286.4,
"r_y2": 570.7,
"r_x3": 50.1,
"r_y3": 570.7,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.6,
"r_x1": 286.4,
"r_y1": 591.6,
"r_x2": 286.4,
"r_y2": 582.7,
"r_x3": 50.1,
"r_y3": 582.7,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.5,
"r_x1": 286.4,
"r_y1": 603.5,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.5,
"r_x1": 286.4,
"r_y1": 615.5,
"r_x2": 286.4,
"r_y2": 606.6,
"r_x3": 50.1,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.5,
"r_x1": 242.3,
"r_y1": 627.5,
"r_x2": 242.3,
"r_y2": 618.6,
"r_x3": 50.1,
"r_y3": 618.6,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 630.7,
"r": 286.4,
"b": 651.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 639.6,
"r_x1": 286.4,
"r_y1": 639.6,
"r_x2": 286.4,
"r_y2": 630.7,
"r_x3": 62.1,
"r_y3": 630.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 651.6,
"r_x1": 179.9,
"r_y1": 651.6,
"r_x2": 179.9,
"r_y2": 642.7,
"r_x3": 50.1,
"r_y3": 642.7,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 662.4,
"r": 153.6,
"b": 672.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 672.2,
"r_x1": 64.3,
"r_y1": 672.2,
"r_x2": 64.3,
"r_y2": 662.4,
"r_x3": 50.1,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 672.2,
"r_x1": 153.6,
"r_y1": 672.2,
"r_x2": 153.6,
"r_y2": 662.4,
"r_x3": 73.8,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 681.3,
"r": 286.4,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 690.2,
"r_x1": 286.4,
"r_y1": 690.2,
"r_x2": 286.4,
"r_y2": 681.3,
"r_x3": 62.1,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.2,
"r_x1": 286.4,
"r_y1": 702.2,
"r_x2": 286.4,
"r_y2": 693.3,
"r_x3": 50.1,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 714.1,
"r_x1": 84.1,
"r_y1": 714.1,
"r_x2": 84.1,
"r_y2": 705.2,
"r_x3": 50.1,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.2,
"r_y0": 714.1,
"r_x1": 286.4,
"r_y1": 714.1,
"r_x2": 286.4,
"r_y2": 705.2,
"r_x3": 91.2,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 162.7,
"r": 545.1,
"b": 207.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 171.6,
"r_x1": 545.1,
"r_y1": 171.6,
"r_x2": 545.1,
"r_y2": 162.7,
"r_x3": 308.9,
"r_y3": 162.7,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 174.6,
"r_x3": 308.9,
"r_y3": 174.6,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 195.5,
"r_x1": 545.1,
"r_y1": 195.5,
"r_x2": 545.1,
"r_y2": 186.6,
"r_x3": 308.9,
"r_y3": 186.6,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 207.4,
"r_x1": 484.1,
"r_y1": 207.4,
"r_x2": 484.1,
"r_y2": 198.5,
"r_x3": 308.9,
"r_y3": 198.5,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "text",
"bbox": {
"l": 308.9,
"t": 211.2,
"r": 545.1,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 220.1,
"r_x1": 545.1,
"r_y1": 220.1,
"r_x2": 545.1,
"r_y2": 211.2,
"r_x3": 320.8,
"r_y3": 211.2,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.1,
"r_x1": 448.1,
"r_y1": 232.1,
"r_x2": 448.1,
"r_y2": 223.2,
"r_x3": 308.9,
"r_y3": 223.2,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 235.9,
"r": 545.1,
"b": 316.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 244.8,
"r_x1": 328.3,
"r_y1": 244.8,
"r_x2": 328.3,
"r_y2": 235.9,
"r_x3": 320.8,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 244.8,
"r_x1": 545.1,
"r_y1": 244.8,
"r_x2": 545.1,
"r_y2": 235.9,
"r_x3": 335.4,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.8,
"r_x1": 545.1,
"r_y1": 256.8,
"r_x2": 545.1,
"r_y2": 247.9,
"r_x3": 308.9,
"r_y3": 247.9,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.7,
"r_x1": 545.1,
"r_y1": 268.7,
"r_x2": 545.1,
"r_y2": 259.8,
"r_x3": 308.9,
"r_y3": 259.8,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.7,
"r_x1": 393.4,
"r_y1": 280.7,
"r_x2": 393.4,
"r_y2": 271.8,
"r_x3": 308.9,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.1,
"r_y0": 280.7,
"r_x1": 545.1,
"r_y1": 280.7,
"r_x2": 545.1,
"r_y2": 271.8,
"r_x3": 400.1,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.6,
"r_x1": 545.1,
"r_y1": 292.6,
"r_x2": 545.1,
"r_y2": 283.7,
"r_x3": 308.9,
"r_y3": 283.7,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.6,
"r_x1": 545.1,
"r_y1": 304.6,
"r_x2": 545.1,
"r_y2": 295.7,
"r_x3": 308.9,
"r_y3": 295.7,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.5,
"r_x1": 425.7,
"r_y1": 316.5,
"r_x2": 425.7,
"r_y2": 307.6,
"r_x3": 308.9,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 320.4,
"r": 545.1,
"b": 448.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 329.3,
"r_x1": 328.5,
"r_y1": 329.3,
"r_x2": 328.5,
"r_y2": 320.4,
"r_x3": 320.8,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 329.3,
"r_x1": 545.1,
"r_y1": 329.3,
"r_x2": 545.1,
"r_y2": 320.4,
"r_x3": 331.1,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 341.2,
"r_x1": 545.1,
"r_y1": 341.2,
"r_x2": 545.1,
"r_y2": 332.3,
"r_x3": 308.9,
"r_y3": 332.3,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 353.2,
"r_x1": 545.1,
"r_y1": 353.2,
"r_x2": 545.1,
"r_y2": 344.3,
"r_x3": 308.9,
"r_y3": 344.3,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 365.1,
"r_x1": 545.1,
"r_y1": 365.1,
"r_x2": 545.1,
"r_y2": 356.2,
"r_x3": 308.9,
"r_y3": 356.2,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 377.1,
"r_x1": 545.1,
"r_y1": 377.1,
"r_x2": 545.1,
"r_y2": 368.2,
"r_x3": 308.9,
"r_y3": 368.2,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 389.0,
"r_x1": 545.1,
"r_y1": 389.0,
"r_x2": 545.1,
"r_y2": 380.1,
"r_x3": 308.9,
"r_y3": 380.1,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 401.0,
"r_x1": 545.1,
"r_y1": 401.0,
"r_x2": 545.1,
"r_y2": 392.1,
"r_x3": 308.9,
"r_y3": 392.1,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.9,
"r_x1": 545.1,
"r_y1": 412.9,
"r_x2": 545.1,
"r_y2": 404.0,
"r_x3": 308.9,
"r_y3": 404.0,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.9,
"r_x1": 545.1,
"r_y1": 424.9,
"r_x2": 545.1,
"r_y2": 416.0,
"r_x3": 308.9,
"r_y3": 416.0,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.9,
"r_x1": 545.1,
"r_y1": 436.9,
"r_x2": 545.1,
"r_y2": 427.9,
"r_x3": 308.9,
"r_y3": 427.9,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.8,
"r_x1": 345.9,
"r_y1": 448.8,
"r_x2": 345.9,
"r_y2": 439.9,
"r_x3": 308.9,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 452.6,
"r": 545.1,
"b": 497.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 461.5,
"r_x1": 328.3,
"r_y1": 461.5,
"r_x2": 328.3,
"r_y2": 452.6,
"r_x3": 320.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.5,
"r_x1": 485.8,
"r_y1": 461.5,
"r_x2": 485.8,
"r_y2": 452.6,
"r_x3": 330.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.1,
"r_y0": 461.3,
"r_x1": 511.9,
"r_y1": 461.3,
"r_x2": 511.9,
"r_y2": 452.7,
"r_x3": 488.1,
"r_y3": 452.7,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.9,
"r_y0": 461.5,
"r_x1": 545.1,
"r_y1": 461.5,
"r_x2": 545.1,
"r_y2": 452.6,
"r_x3": 511.9,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 473.5,
"r_x1": 545.1,
"r_y1": 473.5,
"r_x2": 545.1,
"r_y2": 464.6,
"r_x3": 308.9,
"r_y3": 464.6,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 485.4,
"r_x1": 545.1,
"r_y1": 485.4,
"r_x2": 545.1,
"r_y2": 476.5,
"r_x3": 308.9,
"r_y3": 476.5,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.4,
"r_x1": 379.1,
"r_y1": 497.4,
"r_x2": 379.1,
"r_y2": 488.5,
"r_x3": 308.9,
"r_y3": 488.5,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 501.2,
"r": 545.1,
"b": 546.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 510.1,
"r_x1": 328.7,
"r_y1": 510.1,
"r_x2": 328.7,
"r_y2": 501.2,
"r_x3": 320.8,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 510.1,
"r_x1": 545.1,
"r_y1": 510.1,
"r_x2": 545.1,
"r_y2": 501.2,
"r_x3": 331.3,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 522.1,
"r_x1": 545.1,
"r_y1": 522.1,
"r_x2": 545.1,
"r_y2": 513.2,
"r_x3": 308.9,
"r_y3": 513.2,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 534.0,
"r_x1": 384.3,
"r_y1": 534.0,
"r_x2": 384.3,
"r_y2": 525.1,
"r_x3": 308.9,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.3,
"r_y0": 534.0,
"r_x1": 545.1,
"r_y1": 534.0,
"r_x2": 545.1,
"r_y2": 525.1,
"r_x3": 391.3,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 546.0,
"r_x1": 496.2,
"r_y1": 546.0,
"r_x2": 496.2,
"r_y2": 537.1,
"r_x3": 308.9,
"r_y3": 537.1,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 549.8,
"r": 545.1,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 558.7,
"r_x1": 328.3,
"r_y1": 558.7,
"r_x2": 328.3,
"r_y2": 549.8,
"r_x3": 320.8,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.7,
"r_x1": 545.1,
"r_y1": 558.7,
"r_x2": 545.1,
"r_y2": 549.8,
"r_x3": 335.4,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 570.6,
"r_x1": 545.1,
"r_y1": 570.6,
"r_x2": 545.1,
"r_y2": 561.7,
"r_x3": 308.9,
"r_y3": 561.7,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 582.6,
"r_x1": 545.1,
"r_y1": 582.6,
"r_x2": 545.1,
"r_y2": 573.7,
"r_x3": 308.9,
"r_y3": 573.7,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 594.5,
"r_x1": 545.1,
"r_y1": 594.5,
"r_x2": 545.1,
"r_y2": 585.6,
"r_x3": 308.9,
"r_y3": 585.6,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 606.5,
"r_x1": 341.2,
"r_y1": 606.5,
"r_x2": 341.2,
"r_y2": 597.6,
"r_x3": 308.9,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 622.3,
"r": 545.1,
"b": 647.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 633.0,
"r_x1": 316.8,
"r_y1": 633.0,
"r_x2": 316.8,
"r_y2": 622.3,
"r_x3": 308.9,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.3,
"r_y0": 633.0,
"r_x1": 545.1,
"r_y1": 633.0,
"r_x2": 545.1,
"r_y2": 622.3,
"r_x3": 327.3,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 647.0,
"r_x1": 357.3,
"r_y1": 647.0,
"r_x2": 357.3,
"r_y2": 636.2,
"r_x3": 326.8,
"r_y3": 636.2,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 657.4,
"r": 545.1,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 666.3,
"r_x1": 545.1,
"r_y1": 666.3,
"r_x2": 545.1,
"r_y2": 657.4,
"r_x3": 320.8,
"r_y3": 657.4,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 678.3,
"r_x1": 545.1,
"r_y1": 678.3,
"r_x2": 545.1,
"r_y2": 669.4,
"r_x3": 308.9,
"r_y3": 669.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 690.2,
"r_x1": 545.1,
"r_y1": 690.2,
"r_x2": 545.1,
"r_y2": 681.3,
"r_x3": 308.9,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 702.2,
"r_x1": 545.1,
"r_y1": 702.2,
"r_x2": 545.1,
"r_y2": 693.3,
"r_x3": 308.9,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 714.1,
"r_x1": 371.4,
"r_y1": 714.1,
"r_x2": 371.4,
"r_y2": 705.2,
"r_x3": 308.9,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "section_header",
"id": 18,
"page_no": 10,
"cluster": {
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.8,
"t": 110.6,
"r": 465.4,
"b": 135.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.8,
"r_y0": 121.3,
"r_x1": 465.4,
"r_y1": 121.3,
"r_x2": 465.4,
"r_y2": 110.6,
"r_x3": 132.8,
"r_y3": 110.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.2,
"r_y0": 135.5,
"r_x1": 375.0,
"r_y1": 135.5,
"r_x2": 375.0,
"r_y2": 122.3,
"r_x3": 220.2,
"r_y3": 122.3,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"
},
{
"label": "section_header",
"id": 13,
"page_no": 10,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 161.2,
"r": 176.0,
"b": 171.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 171.9,
"r_x1": 57.1,
"r_y1": 171.9,
"r_x2": 57.1,
"r_y2": 161.2,
"r_x3": 50.1,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 171.9,
"r_x1": 176.0,
"r_y1": 171.9,
"r_x2": 176.0,
"r_y2": 161.2,
"r_x3": 66.4,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Details on the datasets"
},
{
"label": "section_header",
"id": 11,
"page_no": 10,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 150.4,
"b": 190.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 190.8,
"r_x1": 64.2,
"r_y1": 190.8,
"r_x2": 64.2,
"r_y2": 181.0,
"r_x3": 50.1,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.6,
"r_y0": 190.8,
"r_x1": 150.4,
"r_y1": 190.8,
"r_x2": 150.4,
"r_y2": 181.0,
"r_x3": 73.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.1. Data preparation"
},
{
"label": "text",
"id": 0,
"page_no": 10,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 199.9,
"r": 286.4,
"b": 388.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 208.8,
"r_x1": 286.4,
"r_y1": 208.8,
"r_x2": 286.4,
"r_y2": 199.9,
"r_x3": 62.1,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 220.8,
"r_x1": 286.4,
"r_y1": 220.8,
"r_x2": 286.4,
"r_y2": 211.9,
"r_x3": 50.1,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 232.7,
"r_x1": 286.4,
"r_y1": 232.7,
"r_x2": 286.4,
"r_y2": 223.8,
"r_x3": 50.1,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 244.7,
"r_x1": 286.4,
"r_y1": 244.7,
"r_x2": 286.4,
"r_y2": 235.8,
"r_x3": 50.1,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 256.6,
"r_x1": 286.4,
"r_y1": 256.6,
"r_x2": 286.4,
"r_y2": 247.7,
"r_x3": 50.1,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 268.6,
"r_x1": 286.4,
"r_y1": 268.6,
"r_x2": 286.4,
"r_y2": 259.7,
"r_x3": 50.1,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 280.6,
"r_x1": 286.4,
"r_y1": 280.6,
"r_x2": 286.4,
"r_y2": 271.7,
"r_x3": 50.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 292.5,
"r_x1": 286.4,
"r_y1": 292.5,
"r_x2": 286.4,
"r_y2": 283.6,
"r_x3": 50.1,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 295.6,
"r_x3": 50.1,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 316.4,
"r_x1": 286.4,
"r_y1": 316.4,
"r_x2": 286.4,
"r_y2": 307.5,
"r_x3": 50.1,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 328.4,
"r_x1": 286.4,
"r_y1": 328.4,
"r_x2": 286.4,
"r_y2": 319.5,
"r_x3": 50.1,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 340.3,
"r_x1": 286.4,
"r_y1": 340.3,
"r_x2": 286.4,
"r_y2": 331.4,
"r_x3": 50.1,
"r_y3": 331.4,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 352.3,
"r_x1": 286.4,
"r_y1": 352.3,
"r_x2": 286.4,
"r_y2": 343.4,
"r_x3": 50.1,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 364.2,
"r_x1": 286.4,
"r_y1": 364.2,
"r_x2": 286.4,
"r_y2": 355.3,
"r_x3": 50.1,
"r_y3": 355.3,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 376.2,
"r_x1": 286.4,
"r_y1": 376.2,
"r_x2": 286.4,
"r_y2": 367.3,
"r_x3": 50.1,
"r_y3": 367.3,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 388.2,
"r_x1": 230.8,
"r_y1": 388.2,
"r_x2": 230.8,
"r_y2": 379.2,
"r_x3": 50.1,
"r_y3": 379.2,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length."
},
{
"label": "text",
"id": 2,
"page_no": 10,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 391.4,
"r": 286.4,
"b": 627.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 400.3,
"r_x1": 286.4,
"r_y1": 400.3,
"r_x2": 286.4,
"r_y2": 391.4,
"r_x3": 62.1,
"r_y3": 391.4,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 412.3,
"r_x1": 286.4,
"r_y1": 412.3,
"r_x2": 286.4,
"r_y2": 403.4,
"r_x3": 50.1,
"r_y3": 403.4,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 424.2,
"r_x1": 286.4,
"r_y1": 424.2,
"r_x2": 286.4,
"r_y2": 415.3,
"r_x3": 50.1,
"r_y3": 415.3,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 436.2,
"r_x1": 286.4,
"r_y1": 436.2,
"r_x2": 286.4,
"r_y2": 427.3,
"r_x3": 50.1,
"r_y3": 427.3,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.1,
"r_x1": 286.4,
"r_y1": 448.1,
"r_x2": 286.4,
"r_y2": 439.2,
"r_x3": 50.1,
"r_y3": 439.2,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.1,
"r_x1": 286.4,
"r_y1": 460.1,
"r_x2": 286.4,
"r_y2": 451.2,
"r_x3": 50.1,
"r_y3": 451.2,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.0,
"r_x1": 286.4,
"r_y1": 472.0,
"r_x2": 286.4,
"r_y2": 463.1,
"r_x3": 50.1,
"r_y3": 463.1,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.0,
"r_x1": 286.4,
"r_y1": 484.0,
"r_x2": 286.4,
"r_y2": 475.1,
"r_x3": 50.1,
"r_y3": 475.1,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.0,
"r_x1": 286.4,
"r_y1": 496.0,
"r_x2": 286.4,
"r_y2": 487.0,
"r_x3": 50.1,
"r_y3": 487.0,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 507.9,
"r_x1": 286.4,
"r_y1": 507.9,
"r_x2": 286.4,
"r_y2": 499.0,
"r_x3": 50.1,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 519.9,
"r_x1": 286.4,
"r_y1": 519.9,
"r_x2": 286.4,
"r_y2": 511.0,
"r_x3": 50.1,
"r_y3": 511.0,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 531.8,
"r_x1": 286.4,
"r_y1": 531.8,
"r_x2": 286.4,
"r_y2": 522.9,
"r_x3": 50.1,
"r_y3": 522.9,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.8,
"r_x1": 286.4,
"r_y1": 543.8,
"r_x2": 286.4,
"r_y2": 534.9,
"r_x3": 50.1,
"r_y3": 534.9,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.7,
"r_x1": 286.4,
"r_y1": 555.7,
"r_x2": 286.4,
"r_y2": 546.8,
"r_x3": 50.1,
"r_y3": 546.8,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.7,
"r_x1": 257.5,
"r_y1": 567.7,
"r_x2": 257.5,
"r_y2": 558.8,
"r_x3": 50.1,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.9,
"r_y0": 567.7,
"r_x1": 286.4,
"r_y1": 567.7,
"r_x2": 286.4,
"r_y2": 558.8,
"r_x3": 263.9,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.6,
"r_x1": 286.4,
"r_y1": 579.6,
"r_x2": 286.4,
"r_y2": 570.7,
"r_x3": 50.1,
"r_y3": 570.7,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.6,
"r_x1": 286.4,
"r_y1": 591.6,
"r_x2": 286.4,
"r_y2": 582.7,
"r_x3": 50.1,
"r_y3": 582.7,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.5,
"r_x1": 286.4,
"r_y1": 603.5,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.5,
"r_x1": 286.4,
"r_y1": 615.5,
"r_x2": 286.4,
"r_y2": 606.6,
"r_x3": 50.1,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.5,
"r_x1": 242.3,
"r_y1": 627.5,
"r_x2": 242.3,
"r_y2": 618.6,
"r_x3": 50.1,
"r_y3": 618.6,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 14,
"page_no": 10,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 630.7,
"r": 286.4,
"b": 651.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 639.6,
"r_x1": 286.4,
"r_y1": 639.6,
"r_x2": 286.4,
"r_y2": 630.7,
"r_x3": 62.1,
"r_y3": 630.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 651.6,
"r_x1": 179.9,
"r_y1": 651.6,
"r_x2": 179.9,
"r_y2": 642.7,
"r_x3": 50.1,
"r_y3": 642.7,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."
},
{
"label": "section_header",
"id": 12,
"page_no": 10,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 662.4,
"r": 153.6,
"b": 672.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 672.2,
"r_x1": 64.3,
"r_y1": 672.2,
"r_x2": 64.3,
"r_y2": 662.4,
"r_x3": 50.1,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 672.2,
"r_x1": 153.6,
"r_y1": 672.2,
"r_x2": 153.6,
"r_y2": 662.4,
"r_x3": 73.8,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.2. Synthetic datasets"
},
{
"label": "text",
"id": 3,
"page_no": 10,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 681.3,
"r": 286.4,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 690.2,
"r_x1": 286.4,
"r_y1": 690.2,
"r_x2": 286.4,
"r_y2": 681.3,
"r_x3": 62.1,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.2,
"r_x1": 286.4,
"r_y1": 702.2,
"r_x2": 286.4,
"r_y2": 693.3,
"r_x3": 50.1,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 714.1,
"r_x1": 84.1,
"r_y1": 714.1,
"r_x2": 84.1,
"r_y2": 705.2,
"r_x3": 50.1,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.2,
"r_y0": 714.1,
"r_x1": 286.4,
"r_y1": 714.1,
"r_x2": 286.4,
"r_y2": 705.2,
"r_x3": 91.2,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"
},
{
"label": "text",
"id": 8,
"page_no": 10,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 162.7,
"r": 545.1,
"b": 207.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 171.6,
"r_x1": 545.1,
"r_y1": 171.6,
"r_x2": 545.1,
"r_y2": 162.7,
"r_x3": 308.9,
"r_y3": 162.7,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 174.6,
"r_x3": 308.9,
"r_y3": 174.6,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 195.5,
"r_x1": 545.1,
"r_y1": 195.5,
"r_x2": 545.1,
"r_y2": 186.6,
"r_x3": 308.9,
"r_y3": 186.6,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 207.4,
"r_x1": 484.1,
"r_y1": 207.4,
"r_x2": 484.1,
"r_y2": 198.5,
"r_x3": 308.9,
"r_y3": 198.5,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."
},
{
"label": "text",
"id": 15,
"page_no": 10,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 308.9,
"t": 211.2,
"r": 545.1,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 220.1,
"r_x1": 545.1,
"r_y1": 220.1,
"r_x2": 545.1,
"r_y2": 211.2,
"r_x3": 320.8,
"r_y3": 211.2,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.1,
"r_x1": 448.1,
"r_y1": 232.1,
"r_x2": 448.1,
"r_y2": 223.2,
"r_x3": 308.9,
"r_y3": 223.2,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The process of generating a synthetic dataset can be decomposed into the following steps:"
},
{
"label": "list_item",
"id": 7,
"page_no": 10,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 235.9,
"r": 545.1,
"b": 316.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 244.8,
"r_x1": 328.3,
"r_y1": 244.8,
"r_x2": 328.3,
"r_y2": 235.9,
"r_x3": 320.8,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 244.8,
"r_x1": 545.1,
"r_y1": 244.8,
"r_x2": 545.1,
"r_y2": 235.9,
"r_x3": 335.4,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.8,
"r_x1": 545.1,
"r_y1": 256.8,
"r_x2": 545.1,
"r_y2": 247.9,
"r_x3": 308.9,
"r_y3": 247.9,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.7,
"r_x1": 545.1,
"r_y1": 268.7,
"r_x2": 545.1,
"r_y2": 259.8,
"r_x3": 308.9,
"r_y3": 259.8,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.7,
"r_x1": 393.4,
"r_y1": 280.7,
"r_x2": 393.4,
"r_y2": 271.8,
"r_x3": 308.9,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.1,
"r_y0": 280.7,
"r_x1": 545.1,
"r_y1": 280.7,
"r_x2": 545.1,
"r_y2": 271.8,
"r_x3": 400.1,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.6,
"r_x1": 545.1,
"r_y1": 292.6,
"r_x2": 545.1,
"r_y2": 283.7,
"r_x3": 308.9,
"r_y3": 283.7,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.6,
"r_x1": 545.1,
"r_y1": 304.6,
"r_x2": 545.1,
"r_y2": 295.7,
"r_x3": 308.9,
"r_y3": 295.7,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.5,
"r_x1": 425.7,
"r_y1": 316.5,
"r_x2": 425.7,
"r_y2": 307.6,
"r_x3": 308.9,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."
},
{
"label": "list_item",
"id": 6,
"page_no": 10,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 320.4,
"r": 545.1,
"b": 448.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 329.3,
"r_x1": 328.5,
"r_y1": 329.3,
"r_x2": 328.5,
"r_y2": 320.4,
"r_x3": 320.8,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 329.3,
"r_x1": 545.1,
"r_y1": 329.3,
"r_x2": 545.1,
"r_y2": 320.4,
"r_x3": 331.1,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 341.2,
"r_x1": 545.1,
"r_y1": 341.2,
"r_x2": 545.1,
"r_y2": 332.3,
"r_x3": 308.9,
"r_y3": 332.3,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 353.2,
"r_x1": 545.1,
"r_y1": 353.2,
"r_x2": 545.1,
"r_y2": 344.3,
"r_x3": 308.9,
"r_y3": 344.3,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 365.1,
"r_x1": 545.1,
"r_y1": 365.1,
"r_x2": 545.1,
"r_y2": 356.2,
"r_x3": 308.9,
"r_y3": 356.2,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 377.1,
"r_x1": 545.1,
"r_y1": 377.1,
"r_x2": 545.1,
"r_y2": 368.2,
"r_x3": 308.9,
"r_y3": 368.2,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 389.0,
"r_x1": 545.1,
"r_y1": 389.0,
"r_x2": 545.1,
"r_y2": 380.1,
"r_x3": 308.9,
"r_y3": 380.1,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 401.0,
"r_x1": 545.1,
"r_y1": 401.0,
"r_x2": 545.1,
"r_y2": 392.1,
"r_x3": 308.9,
"r_y3": 392.1,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.9,
"r_x1": 545.1,
"r_y1": 412.9,
"r_x2": 545.1,
"r_y2": 404.0,
"r_x3": 308.9,
"r_y3": 404.0,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.9,
"r_x1": 545.1,
"r_y1": 424.9,
"r_x2": 545.1,
"r_y2": 416.0,
"r_x3": 308.9,
"r_y3": 416.0,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.9,
"r_x1": 545.1,
"r_y1": 436.9,
"r_x2": 545.1,
"r_y2": 427.9,
"r_x3": 308.9,
"r_y3": 427.9,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.8,
"r_x1": 345.9,
"r_y1": 448.8,
"r_x2": 345.9,
"r_y2": 439.9,
"r_x3": 308.9,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."
},
{
"label": "list_item",
"id": 9,
"page_no": 10,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 452.6,
"r": 545.1,
"b": 497.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 461.5,
"r_x1": 328.3,
"r_y1": 461.5,
"r_x2": 328.3,
"r_y2": 452.6,
"r_x3": 320.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.5,
"r_x1": 485.8,
"r_y1": 461.5,
"r_x2": 485.8,
"r_y2": 452.6,
"r_x3": 330.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.1,
"r_y0": 461.3,
"r_x1": 511.9,
"r_y1": 461.3,
"r_x2": 511.9,
"r_y2": 452.7,
"r_x3": 488.1,
"r_y3": 452.7,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.9,
"r_y0": 461.5,
"r_x1": 545.1,
"r_y1": 461.5,
"r_x2": 545.1,
"r_y2": 452.6,
"r_x3": 511.9,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 473.5,
"r_x1": 545.1,
"r_y1": 473.5,
"r_x2": 545.1,
"r_y2": 464.6,
"r_x3": 308.9,
"r_y3": 464.6,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 485.4,
"r_x1": 545.1,
"r_y1": 485.4,
"r_x2": 545.1,
"r_y2": 476.5,
"r_x3": 308.9,
"r_y3": 476.5,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.4,
"r_x1": 379.1,
"r_y1": 497.4,
"r_x2": 379.1,
"r_y2": 488.5,
"r_x3": 308.9,
"r_y3": 488.5,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."
},
{
"label": "list_item",
"id": 5,
"page_no": 10,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 501.2,
"r": 545.1,
"b": 546.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 510.1,
"r_x1": 328.7,
"r_y1": 510.1,
"r_x2": 328.7,
"r_y2": 501.2,
"r_x3": 320.8,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 510.1,
"r_x1": 545.1,
"r_y1": 510.1,
"r_x2": 545.1,
"r_y2": 501.2,
"r_x3": 331.3,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 522.1,
"r_x1": 545.1,
"r_y1": 522.1,
"r_x2": 545.1,
"r_y2": 513.2,
"r_x3": 308.9,
"r_y3": 513.2,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 534.0,
"r_x1": 384.3,
"r_y1": 534.0,
"r_x2": 384.3,
"r_y2": 525.1,
"r_x3": 308.9,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.3,
"r_y0": 534.0,
"r_x1": 545.1,
"r_y1": 534.0,
"r_x2": 545.1,
"r_y2": 525.1,
"r_x3": 391.3,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 546.0,
"r_x1": 496.2,
"r_y1": 546.0,
"r_x2": 496.2,
"r_y2": 537.1,
"r_x3": 308.9,
"r_y3": 537.1,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."
},
{
"label": "list_item",
"id": 4,
"page_no": 10,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 549.8,
"r": 545.1,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 558.7,
"r_x1": 328.3,
"r_y1": 558.7,
"r_x2": 328.3,
"r_y2": 549.8,
"r_x3": 320.8,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.7,
"r_x1": 545.1,
"r_y1": 558.7,
"r_x2": 545.1,
"r_y2": 549.8,
"r_x3": 335.4,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 570.6,
"r_x1": 545.1,
"r_y1": 570.6,
"r_x2": 545.1,
"r_y2": 561.7,
"r_x3": 308.9,
"r_y3": 561.7,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 582.6,
"r_x1": 545.1,
"r_y1": 582.6,
"r_x2": 545.1,
"r_y2": 573.7,
"r_x3": 308.9,
"r_y3": 573.7,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 594.5,
"r_x1": 545.1,
"r_y1": 594.5,
"r_x2": 545.1,
"r_y2": 585.6,
"r_x3": 308.9,
"r_y3": 585.6,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 606.5,
"r_x1": 341.2,
"r_y1": 606.5,
"r_x2": 341.2,
"r_y2": 597.6,
"r_x3": 308.9,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."
},
{
"label": "section_header",
"id": 10,
"page_no": 10,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 622.3,
"r": 545.1,
"b": 647.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 633.0,
"r_x1": 316.8,
"r_y1": 633.0,
"r_x2": 316.8,
"r_y2": 622.3,
"r_x3": 308.9,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.3,
"r_y0": 633.0,
"r_x1": 545.1,
"r_y1": 633.0,
"r_x2": 545.1,
"r_y2": 622.3,
"r_x3": 327.3,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 647.0,
"r_x1": 357.3,
"r_y1": 647.0,
"r_x2": 357.3,
"r_y2": 636.2,
"r_x3": 326.8,
"r_y3": 636.2,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Prediction post-processing for PDF documents"
},
{
"label": "text",
"id": 1,
"page_no": 10,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 657.4,
"r": 545.1,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 666.3,
"r_x1": 545.1,
"r_y1": 666.3,
"r_x2": 545.1,
"r_y2": 657.4,
"r_x3": 320.8,
"r_y3": 657.4,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 678.3,
"r_x1": 545.1,
"r_y1": 678.3,
"r_x2": 545.1,
"r_y2": 669.4,
"r_x3": 308.9,
"r_y3": 669.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 690.2,
"r_x1": 545.1,
"r_y1": 690.2,
"r_x2": 545.1,
"r_y2": 681.3,
"r_x3": 308.9,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 702.2,
"r_x1": 545.1,
"r_y1": 702.2,
"r_x2": 545.1,
"r_y2": 693.3,
"r_x3": 308.9,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 714.1,
"r_x1": 371.4,
"r_y1": 714.1,
"r_x2": 371.4,
"r_y2": 705.2,
"r_x3": 308.9,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"
},
{
"label": "page_footer",
"id": 16,
"page_no": 10,
"cluster": {
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "11"
}
],
"body": [
{
"label": "section_header",
"id": 18,
"page_no": 10,
"cluster": {
"id": 18,
"label": "section_header",
"bbox": {
"l": 132.8,
"t": 110.6,
"r": 465.4,
"b": 135.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.65,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.8,
"r_y0": 121.3,
"r_x1": 465.4,
"r_y1": 121.3,
"r_x2": 465.4,
"r_y2": 110.6,
"r_x3": 132.8,
"r_y3": 110.6,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer: Table Structure Understanding with Transformers",
"orig": "TableFormer: Table Structure Understanding with Transformers",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.2,
"r_y0": 135.5,
"r_x1": 375.0,
"r_y1": 135.5,
"r_x2": 375.0,
"r_y2": 122.3,
"r_x3": 220.2,
"r_y3": 122.3,
"coord_origin": "TOPLEFT"
},
"text": "Supplementary Material",
"orig": "Supplementary Material",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"
},
{
"label": "section_header",
"id": 13,
"page_no": 10,
"cluster": {
"id": 13,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 161.2,
"r": 176.0,
"b": 171.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 171.9,
"r_x1": 57.1,
"r_y1": 171.9,
"r_x2": 57.1,
"r_y2": 161.2,
"r_x3": 50.1,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 66.4,
"r_y0": 171.9,
"r_x1": 176.0,
"r_y1": 171.9,
"r_x2": 176.0,
"r_y2": 161.2,
"r_x3": 66.4,
"r_y3": 161.2,
"coord_origin": "TOPLEFT"
},
"text": "Details on the datasets",
"orig": "Details on the datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Details on the datasets"
},
{
"label": "section_header",
"id": 11,
"page_no": 10,
"cluster": {
"id": 11,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 181.0,
"r": 150.4,
"b": 190.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 190.8,
"r_x1": 64.2,
"r_y1": 190.8,
"r_x2": 64.2,
"r_y2": 181.0,
"r_x3": 50.1,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "1.1.",
"orig": "1.1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.6,
"r_y0": 190.8,
"r_x1": 150.4,
"r_y1": 190.8,
"r_x2": 150.4,
"r_y2": 181.0,
"r_x3": 73.6,
"r_y3": 181.0,
"coord_origin": "TOPLEFT"
},
"text": "Data preparation",
"orig": "Data preparation",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.1. Data preparation"
},
{
"label": "text",
"id": 0,
"page_no": 10,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 199.9,
"r": 286.4,
"b": 388.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.99,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 208.8,
"r_x1": 286.4,
"r_y1": 208.8,
"r_x2": 286.4,
"r_y2": 199.9,
"r_x3": 62.1,
"r_y3": 199.9,
"coord_origin": "TOPLEFT"
},
"text": "As a first step of our data preparation process, we have",
"orig": "As a first step of our data preparation process, we have",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 220.8,
"r_x1": 286.4,
"r_y1": 220.8,
"r_x2": 286.4,
"r_y2": 211.9,
"r_x3": 50.1,
"r_y3": 211.9,
"coord_origin": "TOPLEFT"
},
"text": "calculated statistics over the datasets across the following",
"orig": "calculated statistics over the datasets across the following",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 232.7,
"r_x1": 286.4,
"r_y1": 232.7,
"r_x2": 286.4,
"r_y2": 223.8,
"r_x3": 50.1,
"r_y3": 223.8,
"coord_origin": "TOPLEFT"
},
"text": "dimensions: (1) table size measured in the number of rows",
"orig": "dimensions: (1) table size measured in the number of rows",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 244.7,
"r_x1": 286.4,
"r_y1": 244.7,
"r_x2": 286.4,
"r_y2": 235.8,
"r_x3": 50.1,
"r_y3": 235.8,
"coord_origin": "TOPLEFT"
},
"text": "and columns, (2) complexity of the table, (3) strictness of",
"orig": "and columns, (2) complexity of the table, (3) strictness of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 256.6,
"r_x1": 286.4,
"r_y1": 256.6,
"r_x2": 286.4,
"r_y2": 247.7,
"r_x3": 50.1,
"r_y3": 247.7,
"coord_origin": "TOPLEFT"
},
"text": "the provided HTML structure and (4) completeness (i.e. no",
"orig": "the provided HTML structure and (4) completeness (i.e. no",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 268.6,
"r_x1": 286.4,
"r_y1": 268.6,
"r_x2": 286.4,
"r_y2": 259.7,
"r_x3": 50.1,
"r_y3": 259.7,
"coord_origin": "TOPLEFT"
},
"text": "omitted bounding boxes). A table is considered to be simple",
"orig": "omitted bounding boxes). A table is considered to be simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 280.6,
"r_x1": 286.4,
"r_y1": 280.6,
"r_x2": 286.4,
"r_y2": 271.7,
"r_x3": 50.1,
"r_y3": 271.7,
"coord_origin": "TOPLEFT"
},
"text": "if it does not contain row spans or column spans. Addition-",
"orig": "if it does not contain row spans or column spans. Addition-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 292.5,
"r_x1": 286.4,
"r_y1": 292.5,
"r_x2": 286.4,
"r_y2": 283.6,
"r_x3": 50.1,
"r_y3": 283.6,
"coord_origin": "TOPLEFT"
},
"text": "ally, a table has a strict HTML structure if every row has the",
"orig": "ally, a table has a strict HTML structure if every row has the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 304.5,
"r_x1": 286.4,
"r_y1": 304.5,
"r_x2": 286.4,
"r_y2": 295.6,
"r_x3": 50.1,
"r_y3": 295.6,
"coord_origin": "TOPLEFT"
},
"text": "same number of columns after taking into account any row",
"orig": "same number of columns after taking into account any row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 316.4,
"r_x1": 286.4,
"r_y1": 316.4,
"r_x2": 286.4,
"r_y2": 307.5,
"r_x3": 50.1,
"r_y3": 307.5,
"coord_origin": "TOPLEFT"
},
"text": "or column spans. Therefore a strict HTML structure looks",
"orig": "or column spans. Therefore a strict HTML structure looks",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 328.4,
"r_x1": 286.4,
"r_y1": 328.4,
"r_x2": 286.4,
"r_y2": 319.5,
"r_x3": 50.1,
"r_y3": 319.5,
"coord_origin": "TOPLEFT"
},
"text": "always rectangular. However, HTML is a lenient encoding",
"orig": "always rectangular. However, HTML is a lenient encoding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 340.3,
"r_x1": 286.4,
"r_y1": 340.3,
"r_x2": 286.4,
"r_y2": 331.4,
"r_x3": 50.1,
"r_y3": 331.4,
"coord_origin": "TOPLEFT"
},
"text": "format, i.e. tables with rows of different sizes might still",
"orig": "format, i.e. tables with rows of different sizes might still",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 352.3,
"r_x1": 286.4,
"r_y1": 352.3,
"r_x2": 286.4,
"r_y2": 343.4,
"r_x3": 50.1,
"r_y3": 343.4,
"coord_origin": "TOPLEFT"
},
"text": "be regarded as correct due to implicit display rules. These",
"orig": "be regarded as correct due to implicit display rules. These",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 364.2,
"r_x1": 286.4,
"r_y1": 364.2,
"r_x2": 286.4,
"r_y2": 355.3,
"r_x3": 50.1,
"r_y3": 355.3,
"coord_origin": "TOPLEFT"
},
"text": "implicit rules leave room for ambiguity, which we want to",
"orig": "implicit rules leave room for ambiguity, which we want to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 376.2,
"r_x1": 286.4,
"r_y1": 376.2,
"r_x2": 286.4,
"r_y2": 367.3,
"r_x3": 50.1,
"r_y3": 367.3,
"coord_origin": "TOPLEFT"
},
"text": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"orig": "avoid. As such, we prefer to have \u201dstrict\u201d tables, i.e. tables",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 388.2,
"r_x1": 230.8,
"r_y1": 388.2,
"r_x2": 230.8,
"r_y2": 379.2,
"r_x3": 50.1,
"r_y3": 379.2,
"coord_origin": "TOPLEFT"
},
"text": "where every row has exactly the same length.",
"orig": "where every row has exactly the same length.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). A table is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTML structure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have \"strict\" tables, i.e. tables where every row has exactly the same length."
},
{
"label": "text",
"id": 2,
"page_no": 10,
"cluster": {
"id": 2,
"label": "text",
"bbox": {
"l": 50.1,
"t": 391.4,
"r": 286.4,
"b": 627.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 400.3,
"r_x1": 286.4,
"r_y1": 400.3,
"r_x2": 286.4,
"r_y2": 391.4,
"r_x3": 62.1,
"r_y3": 391.4,
"coord_origin": "TOPLEFT"
},
"text": "We have developed a technique that tries to derive a",
"orig": "We have developed a technique that tries to derive a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 412.3,
"r_x1": 286.4,
"r_y1": 412.3,
"r_x2": 286.4,
"r_y2": 403.4,
"r_x3": 50.1,
"r_y3": 403.4,
"coord_origin": "TOPLEFT"
},
"text": "missing bounding box out of its neighbors. As a first step,",
"orig": "missing bounding box out of its neighbors. As a first step,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 424.2,
"r_x1": 286.4,
"r_y1": 424.2,
"r_x2": 286.4,
"r_y2": 415.3,
"r_x3": 50.1,
"r_y3": 415.3,
"coord_origin": "TOPLEFT"
},
"text": "we use the annotation data to generate the most fine-grained",
"orig": "we use the annotation data to generate the most fine-grained",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 436.2,
"r_x1": 286.4,
"r_y1": 436.2,
"r_x2": 286.4,
"r_y2": 427.3,
"r_x3": 50.1,
"r_y3": 427.3,
"coord_origin": "TOPLEFT"
},
"text": "grid that covers the table structure. In case of strict HTML",
"orig": "grid that covers the table structure. In case of strict HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 448.1,
"r_x1": 286.4,
"r_y1": 448.1,
"r_x2": 286.4,
"r_y2": 439.2,
"r_x3": 50.1,
"r_y3": 439.2,
"coord_origin": "TOPLEFT"
},
"text": "tables, all grid squares are associated with some table cell",
"orig": "tables, all grid squares are associated with some table cell",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 460.1,
"r_x1": 286.4,
"r_y1": 460.1,
"r_x2": 286.4,
"r_y2": 451.2,
"r_x3": 50.1,
"r_y3": 451.2,
"coord_origin": "TOPLEFT"
},
"text": "and in the presence of table spans a cell extends across mul-",
"orig": "and in the presence of table spans a cell extends across mul-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 472.0,
"r_x1": 286.4,
"r_y1": 472.0,
"r_x2": 286.4,
"r_y2": 463.1,
"r_x3": 50.1,
"r_y3": 463.1,
"coord_origin": "TOPLEFT"
},
"text": "tiple grid squares. When enough bounding boxes are known",
"orig": "tiple grid squares. When enough bounding boxes are known",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 484.0,
"r_x1": 286.4,
"r_y1": 484.0,
"r_x2": 286.4,
"r_y2": 475.1,
"r_x3": 50.1,
"r_y3": 475.1,
"coord_origin": "TOPLEFT"
},
"text": "for a rectangular table, it is possible to compute the geo-",
"orig": "for a rectangular table, it is possible to compute the geo-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 496.0,
"r_x1": 286.4,
"r_y1": 496.0,
"r_x2": 286.4,
"r_y2": 487.0,
"r_x3": 50.1,
"r_y3": 487.0,
"coord_origin": "TOPLEFT"
},
"text": "metrical border lines between the grid rows and columns.",
"orig": "metrical border lines between the grid rows and columns.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 507.9,
"r_x1": 286.4,
"r_y1": 507.9,
"r_x2": 286.4,
"r_y2": 499.0,
"r_x3": 50.1,
"r_y3": 499.0,
"coord_origin": "TOPLEFT"
},
"text": "Eventually this information is used to generate the missing",
"orig": "Eventually this information is used to generate the missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 519.9,
"r_x1": 286.4,
"r_y1": 519.9,
"r_x2": 286.4,
"r_y2": 511.0,
"r_x3": 50.1,
"r_y3": 511.0,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes. Additionally, the existence of unused grid",
"orig": "bounding boxes. Additionally, the existence of unused grid",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 531.8,
"r_x1": 286.4,
"r_y1": 531.8,
"r_x2": 286.4,
"r_y2": 522.9,
"r_x3": 50.1,
"r_y3": 522.9,
"coord_origin": "TOPLEFT"
},
"text": "squares indicates that the table rows have unequal number",
"orig": "squares indicates that the table rows have unequal number",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 543.8,
"r_x1": 286.4,
"r_y1": 543.8,
"r_x2": 286.4,
"r_y2": 534.9,
"r_x3": 50.1,
"r_y3": 534.9,
"coord_origin": "TOPLEFT"
},
"text": "of columns and the overall structure is non-strict. The gen-",
"orig": "of columns and the overall structure is non-strict. The gen-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 555.7,
"r_x1": 286.4,
"r_y1": 555.7,
"r_x2": 286.4,
"r_y2": 546.8,
"r_x3": 50.1,
"r_y3": 546.8,
"coord_origin": "TOPLEFT"
},
"text": "eration of missing bounding boxes for non-strict HTML ta-",
"orig": "eration of missing bounding boxes for non-strict HTML ta-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 567.7,
"r_x1": 257.5,
"r_y1": 567.7,
"r_x2": 257.5,
"r_y2": 558.8,
"r_x3": 50.1,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "bles is ambiguous and therefore quite challenging.",
"orig": "bles is ambiguous and therefore quite challenging.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 263.9,
"r_y0": 567.7,
"r_x1": 286.4,
"r_y1": 567.7,
"r_x2": 286.4,
"r_y2": 558.8,
"r_x3": 263.9,
"r_y3": 558.8,
"coord_origin": "TOPLEFT"
},
"text": "Thus,",
"orig": "Thus,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 579.6,
"r_x1": 286.4,
"r_y1": 579.6,
"r_x2": 286.4,
"r_y2": 570.7,
"r_x3": 50.1,
"r_y3": 570.7,
"coord_origin": "TOPLEFT"
},
"text": "we have decided to simply discard those tables. In case of",
"orig": "we have decided to simply discard those tables. In case of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 591.6,
"r_x1": 286.4,
"r_y1": 591.6,
"r_x2": 286.4,
"r_y2": 582.7,
"r_x3": 50.1,
"r_y3": 582.7,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet we have computed missing bounding boxes for",
"orig": "PubTabNet we have computed missing bounding boxes for",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 603.5,
"r_x1": 286.4,
"r_y1": 603.5,
"r_x2": 286.4,
"r_y2": 594.6,
"r_x3": 50.1,
"r_y3": 594.6,
"coord_origin": "TOPLEFT"
},
"text": "48% of the simple and 69% of the complex tables. Regard-",
"orig": "48% of the simple and 69% of the complex tables. Regard-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 615.5,
"r_x1": 286.4,
"r_y1": 615.5,
"r_x2": 286.4,
"r_y2": 606.6,
"r_x3": 50.1,
"r_y3": 606.6,
"coord_origin": "TOPLEFT"
},
"text": "ing FinTabNet, 68% of the simple and 98% of the complex",
"orig": "ing FinTabNet, 68% of the simple and 98% of the complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 627.5,
"r_x1": 242.3,
"r_y1": 627.5,
"r_x2": 242.3,
"r_y2": 618.6,
"r_x3": 50.1,
"r_y3": 618.6,
"coord_origin": "TOPLEFT"
},
"text": "tables require the generation of bounding boxes.",
"orig": "tables require the generation of bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."
},
{
"label": "text",
"id": 14,
"page_no": 10,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 630.7,
"r": 286.4,
"b": 651.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 639.6,
"r_x1": 286.4,
"r_y1": 639.6,
"r_x2": 286.4,
"r_y2": 630.7,
"r_x3": 62.1,
"r_y3": 630.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7 illustrates the distribution of the tables across",
"orig": "Figure 7 illustrates the distribution of the tables across",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 651.6,
"r_x1": 179.9,
"r_y1": 651.6,
"r_x2": 179.9,
"r_y2": 642.7,
"r_x3": 50.1,
"r_y3": 642.7,
"coord_origin": "TOPLEFT"
},
"text": "different dimensions per dataset.",
"orig": "different dimensions per dataset.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."
},
{
"label": "section_header",
"id": 12,
"page_no": 10,
"cluster": {
"id": 12,
"label": "section_header",
"bbox": {
"l": 50.1,
"t": 662.4,
"r": 153.6,
"b": 672.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 672.2,
"r_x1": 64.3,
"r_y1": 672.2,
"r_x2": 64.3,
"r_y2": 662.4,
"r_x3": 50.1,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "1.2.",
"orig": "1.2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 672.2,
"r_x1": 153.6,
"r_y1": 672.2,
"r_x2": 153.6,
"r_y2": 662.4,
"r_x3": 73.8,
"r_y3": 662.4,
"coord_origin": "TOPLEFT"
},
"text": "Synthetic datasets",
"orig": "Synthetic datasets",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1.2. Synthetic datasets"
},
{
"label": "text",
"id": 3,
"page_no": 10,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 681.3,
"r": 286.4,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 690.2,
"r_x1": 286.4,
"r_y1": 690.2,
"r_x2": 286.4,
"r_y2": 681.3,
"r_x3": 62.1,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "Aiming to train and evaluate our models in a broader",
"orig": "Aiming to train and evaluate our models in a broader",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 702.2,
"r_x1": 286.4,
"r_y1": 702.2,
"r_x2": 286.4,
"r_y2": 693.3,
"r_x3": 50.1,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "spectrum of table data we have synthesized four types of",
"orig": "spectrum of table data we have synthesized four types of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 714.1,
"r_x1": 84.1,
"r_y1": 714.1,
"r_x2": 84.1,
"r_y2": 705.2,
"r_x3": 50.1,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "datasets.",
"orig": "datasets.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 91.2,
"r_y0": 714.1,
"r_x1": 286.4,
"r_y1": 714.1,
"r_x2": 286.4,
"r_y2": 705.2,
"r_x3": 91.2,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "Each one contains tables with different appear-",
"orig": "Each one contains tables with different appear-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"
},
{
"label": "text",
"id": 8,
"page_no": 10,
"cluster": {
"id": 8,
"label": "text",
"bbox": {
"l": 308.9,
"t": 162.7,
"r": 545.1,
"b": 207.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 171.6,
"r_x1": 545.1,
"r_y1": 171.6,
"r_x2": 545.1,
"r_y2": 162.7,
"r_x3": 308.9,
"r_y3": 162.7,
"coord_origin": "TOPLEFT"
},
"text": "ances in regard to their size, structure, style and content.",
"orig": "ances in regard to their size, structure, style and content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 183.5,
"r_x1": 545.1,
"r_y1": 183.5,
"r_x2": 545.1,
"r_y2": 174.6,
"r_x3": 308.9,
"r_y3": 174.6,
"coord_origin": "TOPLEFT"
},
"text": "Every synthetic dataset contains 150k examples, summing",
"orig": "Every synthetic dataset contains 150k examples, summing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 195.5,
"r_x1": 545.1,
"r_y1": 195.5,
"r_x2": 545.1,
"r_y2": 186.6,
"r_x3": 308.9,
"r_y3": 186.6,
"coord_origin": "TOPLEFT"
},
"text": "up to 600k synthetic examples. All datasets are divided into",
"orig": "up to 600k synthetic examples. All datasets are divided into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 207.4,
"r_x1": 484.1,
"r_y1": 207.4,
"r_x2": 484.1,
"r_y2": 198.5,
"r_x3": 308.9,
"r_y3": 198.5,
"coord_origin": "TOPLEFT"
},
"text": "Train, Test and Val splits (80%, 10%, 10%).",
"orig": "Train, Test and Val splits (80%, 10%, 10%).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."
},
{
"label": "text",
"id": 15,
"page_no": 10,
"cluster": {
"id": 15,
"label": "text",
"bbox": {
"l": 308.9,
"t": 211.2,
"r": 545.1,
"b": 232.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 220.1,
"r_x1": 545.1,
"r_y1": 220.1,
"r_x2": 545.1,
"r_y2": 211.2,
"r_x3": 320.8,
"r_y3": 211.2,
"coord_origin": "TOPLEFT"
},
"text": "The process of generating a synthetic dataset can be de-",
"orig": "The process of generating a synthetic dataset can be de-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 232.1,
"r_x1": 448.1,
"r_y1": 232.1,
"r_x2": 448.1,
"r_y2": 223.2,
"r_x3": 308.9,
"r_y3": 223.2,
"coord_origin": "TOPLEFT"
},
"text": "composed into the following steps:",
"orig": "composed into the following steps:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "The process of generating a synthetic dataset can be decomposed into the following steps:"
},
{
"label": "list_item",
"id": 7,
"page_no": 10,
"cluster": {
"id": 7,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 235.9,
"r": 545.1,
"b": 316.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 244.8,
"r_x1": 328.3,
"r_y1": 244.8,
"r_x2": 328.3,
"r_y2": 235.9,
"r_x3": 320.8,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 244.8,
"r_x1": 545.1,
"r_y1": 244.8,
"r_x2": 545.1,
"r_y2": 235.9,
"r_x3": 335.4,
"r_y3": 235.9,
"coord_origin": "TOPLEFT"
},
"text": "Prepare styling and content templates: The styling",
"orig": "Prepare styling and content templates: The styling",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 256.8,
"r_x1": 545.1,
"r_y1": 256.8,
"r_x2": 545.1,
"r_y2": 247.9,
"r_x3": 308.9,
"r_y3": 247.9,
"coord_origin": "TOPLEFT"
},
"text": "templates have been manually designed and organized into",
"orig": "templates have been manually designed and organized into",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 268.7,
"r_x1": 545.1,
"r_y1": 268.7,
"r_x2": 545.1,
"r_y2": 259.8,
"r_x3": 308.9,
"r_y3": 259.8,
"coord_origin": "TOPLEFT"
},
"text": "groups of scope specific appearances (e.g. financial data,",
"orig": "groups of scope specific appearances (e.g. financial data,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.7,
"r_x1": 393.4,
"r_y1": 280.7,
"r_x2": 393.4,
"r_y2": 271.8,
"r_x3": 308.9,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "marketing data, etc.)",
"orig": "marketing data, etc.)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 400.1,
"r_y0": 280.7,
"r_x1": 545.1,
"r_y1": 280.7,
"r_x2": 545.1,
"r_y2": 271.8,
"r_x3": 400.1,
"r_y3": 271.8,
"coord_origin": "TOPLEFT"
},
"text": "Additionally, we have prepared cu-",
"orig": "Additionally, we have prepared cu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 292.6,
"r_x1": 545.1,
"r_y1": 292.6,
"r_x2": 545.1,
"r_y2": 283.7,
"r_x3": 308.9,
"r_y3": 283.7,
"coord_origin": "TOPLEFT"
},
"text": "rated collections of content templates by extracting the most",
"orig": "rated collections of content templates by extracting the most",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.6,
"r_x1": 545.1,
"r_y1": 304.6,
"r_x2": 545.1,
"r_y2": 295.7,
"r_x3": 308.9,
"r_y3": 295.7,
"coord_origin": "TOPLEFT"
},
"text": "frequently used terms out of non-synthetic datasets (e.g.",
"orig": "frequently used terms out of non-synthetic datasets (e.g.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.5,
"r_x1": 425.7,
"r_y1": 316.5,
"r_x2": 425.7,
"r_y2": 307.6,
"r_x3": 308.9,
"r_y3": 307.6,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet, FinTabNet, etc.).",
"orig": "PubTabNet, FinTabNet, etc.).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."
},
{
"label": "list_item",
"id": 6,
"page_no": 10,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 320.4,
"r": 545.1,
"b": 448.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 329.3,
"r_x1": 328.5,
"r_y1": 329.3,
"r_x2": 328.5,
"r_y2": 320.4,
"r_x3": 320.8,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 329.3,
"r_x1": 545.1,
"r_y1": 329.3,
"r_x2": 545.1,
"r_y2": 320.4,
"r_x3": 331.1,
"r_y3": 320.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate table structures: The structure of each syn-",
"orig": "Generate table structures: The structure of each syn-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 341.2,
"r_x1": 545.1,
"r_y1": 341.2,
"r_x2": 545.1,
"r_y2": 332.3,
"r_x3": 308.9,
"r_y3": 332.3,
"coord_origin": "TOPLEFT"
},
"text": "thetic dataset assumes a horizontal table header which po-",
"orig": "thetic dataset assumes a horizontal table header which po-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 353.2,
"r_x1": 545.1,
"r_y1": 353.2,
"r_x2": 545.1,
"r_y2": 344.3,
"r_x3": 308.9,
"r_y3": 344.3,
"coord_origin": "TOPLEFT"
},
"text": "tentially spans over multiple rows and a table body that",
"orig": "tentially spans over multiple rows and a table body that",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 365.1,
"r_x1": 545.1,
"r_y1": 365.1,
"r_x2": 545.1,
"r_y2": 356.2,
"r_x3": 308.9,
"r_y3": 356.2,
"coord_origin": "TOPLEFT"
},
"text": "may contain a combination of row spans and column spans.",
"orig": "may contain a combination of row spans and column spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 377.1,
"r_x1": 545.1,
"r_y1": 377.1,
"r_x2": 545.1,
"r_y2": 368.2,
"r_x3": 308.9,
"r_y3": 368.2,
"coord_origin": "TOPLEFT"
},
"text": "However, spans are not allowed to cross the header - body",
"orig": "However, spans are not allowed to cross the header - body",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 389.0,
"r_x1": 545.1,
"r_y1": 389.0,
"r_x2": 545.1,
"r_y2": 380.1,
"r_x3": 308.9,
"r_y3": 380.1,
"coord_origin": "TOPLEFT"
},
"text": "boundary. The table structure is described by the parame-",
"orig": "boundary. The table structure is described by the parame-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 401.0,
"r_x1": 545.1,
"r_y1": 401.0,
"r_x2": 545.1,
"r_y2": 392.1,
"r_x3": 308.9,
"r_y3": 392.1,
"coord_origin": "TOPLEFT"
},
"text": "ters: Total number of table rows and columns, number of",
"orig": "ters: Total number of table rows and columns, number of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.9,
"r_x1": 545.1,
"r_y1": 412.9,
"r_x2": 545.1,
"r_y2": 404.0,
"r_x3": 308.9,
"r_y3": 404.0,
"coord_origin": "TOPLEFT"
},
"text": "header rows, type of spans (header only spans, row only",
"orig": "header rows, type of spans (header only spans, row only",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.9,
"r_x1": 545.1,
"r_y1": 424.9,
"r_x2": 545.1,
"r_y2": 416.0,
"r_x3": 308.9,
"r_y3": 416.0,
"coord_origin": "TOPLEFT"
},
"text": "spans, column only spans, both row and column spans),",
"orig": "spans, column only spans, both row and column spans),",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.9,
"r_x1": 545.1,
"r_y1": 436.9,
"r_x2": 545.1,
"r_y2": 427.9,
"r_x3": 308.9,
"r_y3": 427.9,
"coord_origin": "TOPLEFT"
},
"text": "maximum span size and the ratio of the table area covered",
"orig": "maximum span size and the ratio of the table area covered",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.8,
"r_x1": 345.9,
"r_y1": 448.8,
"r_x2": 345.9,
"r_y2": 439.9,
"r_x3": 308.9,
"r_y3": 439.9,
"coord_origin": "TOPLEFT"
},
"text": "by spans.",
"orig": "by spans.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."
},
{
"label": "list_item",
"id": 9,
"page_no": 10,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 452.6,
"r": 545.1,
"b": 497.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 461.5,
"r_x1": 328.3,
"r_y1": 461.5,
"r_x2": 328.3,
"r_y2": 452.6,
"r_x3": 320.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.8,
"r_y0": 461.5,
"r_x1": 485.8,
"r_y1": 461.5,
"r_x2": 485.8,
"r_y2": 452.6,
"r_x3": 330.8,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": "Generate content: Based on the dataset",
"orig": "Generate content: Based on the dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 488.1,
"r_y0": 461.3,
"r_x1": 511.9,
"r_y1": 461.3,
"r_x2": 511.9,
"r_y2": 452.7,
"r_x3": 488.1,
"r_y3": 452.7,
"coord_origin": "TOPLEFT"
},
"text": "theme",
"orig": "theme",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 511.9,
"r_y0": 461.5,
"r_x1": 545.1,
"r_y1": 461.5,
"r_x2": 545.1,
"r_y2": 452.6,
"r_x3": 511.9,
"r_y3": 452.6,
"coord_origin": "TOPLEFT"
},
"text": ", a set of",
"orig": ", a set of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 473.5,
"r_x1": 545.1,
"r_y1": 473.5,
"r_x2": 545.1,
"r_y2": 464.6,
"r_x3": 308.9,
"r_y3": 464.6,
"coord_origin": "TOPLEFT"
},
"text": "suitable content templates is chosen first. Then, this content",
"orig": "suitable content templates is chosen first. Then, this content",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 485.4,
"r_x1": 545.1,
"r_y1": 485.4,
"r_x2": 545.1,
"r_y2": 476.5,
"r_x3": 308.9,
"r_y3": 476.5,
"coord_origin": "TOPLEFT"
},
"text": "can be combined with purely random text to produce the",
"orig": "can be combined with purely random text to produce the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 497.4,
"r_x1": 379.1,
"r_y1": 497.4,
"r_x2": 379.1,
"r_y2": 488.5,
"r_x3": 308.9,
"r_y3": 488.5,
"coord_origin": "TOPLEFT"
},
"text": "synthetic content.",
"orig": "synthetic content.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."
},
{
"label": "list_item",
"id": 5,
"page_no": 10,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 501.2,
"r": 545.1,
"b": 546.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 510.1,
"r_x1": 328.7,
"r_y1": 510.1,
"r_x2": 328.7,
"r_y2": 501.2,
"r_x3": 320.8,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 510.1,
"r_x1": 545.1,
"r_y1": 510.1,
"r_x2": 545.1,
"r_y2": 501.2,
"r_x3": 331.3,
"r_y3": 501.2,
"coord_origin": "TOPLEFT"
},
"text": "Apply styling templates: Depending on the domain",
"orig": "Apply styling templates: Depending on the domain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 522.1,
"r_x1": 545.1,
"r_y1": 522.1,
"r_x2": 545.1,
"r_y2": 513.2,
"r_x3": 308.9,
"r_y3": 513.2,
"coord_origin": "TOPLEFT"
},
"text": "of the synthetic dataset, a set of styling templates is first",
"orig": "of the synthetic dataset, a set of styling templates is first",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 534.0,
"r_x1": 384.3,
"r_y1": 534.0,
"r_x2": 384.3,
"r_y2": 525.1,
"r_x3": 308.9,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "manually selected.",
"orig": "manually selected.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.3,
"r_y0": 534.0,
"r_x1": 545.1,
"r_y1": 534.0,
"r_x2": 545.1,
"r_y2": 525.1,
"r_x3": 391.3,
"r_y3": 525.1,
"coord_origin": "TOPLEFT"
},
"text": "Then, a style is randomly selected to",
"orig": "Then, a style is randomly selected to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 546.0,
"r_x1": 496.2,
"r_y1": 546.0,
"r_x2": 496.2,
"r_y2": 537.1,
"r_x3": 308.9,
"r_y3": 537.1,
"coord_origin": "TOPLEFT"
},
"text": "format the appearance of the synthesized table.",
"orig": "format the appearance of the synthesized table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."
},
{
"label": "list_item",
"id": 4,
"page_no": 10,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 549.8,
"r": 545.1,
"b": 606.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 558.7,
"r_x1": 328.3,
"r_y1": 558.7,
"r_x2": 328.3,
"r_y2": 549.8,
"r_x3": 320.8,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 335.4,
"r_y0": 558.7,
"r_x1": 545.1,
"r_y1": 558.7,
"r_x2": 545.1,
"r_y2": 549.8,
"r_x3": 335.4,
"r_y3": 549.8,
"coord_origin": "TOPLEFT"
},
"text": "Render the complete tables: The synthetic table is",
"orig": "Render the complete tables: The synthetic table is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 570.6,
"r_x1": 545.1,
"r_y1": 570.6,
"r_x2": 545.1,
"r_y2": 561.7,
"r_x3": 308.9,
"r_y3": 561.7,
"coord_origin": "TOPLEFT"
},
"text": "finally rendered by a web browser engine to generate the",
"orig": "finally rendered by a web browser engine to generate the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 582.6,
"r_x1": 545.1,
"r_y1": 582.6,
"r_x2": 545.1,
"r_y2": 573.7,
"r_x3": 308.9,
"r_y3": 573.7,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes for each table cell. A batching technique is",
"orig": "bounding boxes for each table cell. A batching technique is",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 594.5,
"r_x1": 545.1,
"r_y1": 594.5,
"r_x2": 545.1,
"r_y2": 585.6,
"r_x3": 308.9,
"r_y3": 585.6,
"coord_origin": "TOPLEFT"
},
"text": "utilized to optimize the runtime overhead of the rendering",
"orig": "utilized to optimize the runtime overhead of the rendering",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 606.5,
"r_x1": 341.2,
"r_y1": 606.5,
"r_x2": 341.2,
"r_y2": 597.6,
"r_x3": 308.9,
"r_y3": 597.6,
"coord_origin": "TOPLEFT"
},
"text": "process.",
"orig": "process.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."
},
{
"label": "section_header",
"id": 10,
"page_no": 10,
"cluster": {
"id": 10,
"label": "section_header",
"bbox": {
"l": 308.9,
"t": 622.3,
"r": 545.1,
"b": 647.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 633.0,
"r_x1": 316.8,
"r_y1": 633.0,
"r_x2": 316.8,
"r_y2": 622.3,
"r_x3": 308.9,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.3,
"r_y0": 633.0,
"r_x1": 545.1,
"r_y1": 633.0,
"r_x2": 545.1,
"r_y2": 622.3,
"r_x3": 327.3,
"r_y3": 622.3,
"coord_origin": "TOPLEFT"
},
"text": "Prediction post-processing for PDF docu-",
"orig": "Prediction post-processing for PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.8,
"r_y0": 647.0,
"r_x1": 357.3,
"r_y1": 647.0,
"r_x2": 357.3,
"r_y2": 636.2,
"r_x3": 326.8,
"r_y3": 636.2,
"coord_origin": "TOPLEFT"
},
"text": "ments",
"orig": "ments",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Prediction post-processing for PDF documents"
},
{
"label": "text",
"id": 1,
"page_no": 10,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 308.9,
"t": 657.4,
"r": 545.1,
"b": 714.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 666.3,
"r_x1": 545.1,
"r_y1": 666.3,
"r_x2": 545.1,
"r_y2": 657.4,
"r_x3": 320.8,
"r_y3": 657.4,
"coord_origin": "TOPLEFT"
},
"text": "Although TableFormer can predict the table structure and",
"orig": "Although TableFormer can predict the table structure and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 678.3,
"r_x1": 545.1,
"r_y1": 678.3,
"r_x2": 545.1,
"r_y2": 669.4,
"r_x3": 308.9,
"r_y3": 669.4,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes for tables recognized inside PDF docu-",
"orig": "the bounding boxes for tables recognized inside PDF docu-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 690.2,
"r_x1": 545.1,
"r_y1": 690.2,
"r_x2": 545.1,
"r_y2": 681.3,
"r_x3": 308.9,
"r_y3": 681.3,
"coord_origin": "TOPLEFT"
},
"text": "ments, this is not enough when a full reconstruction of the",
"orig": "ments, this is not enough when a full reconstruction of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 702.2,
"r_x1": 545.1,
"r_y1": 702.2,
"r_x2": 545.1,
"r_y2": 693.3,
"r_x3": 308.9,
"r_y3": 693.3,
"coord_origin": "TOPLEFT"
},
"text": "original table is required. This happens mainly due the fol-",
"orig": "original table is required. This happens mainly due the fol-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 714.1,
"r_x1": 371.4,
"r_y1": 714.1,
"r_x2": 371.4,
"r_y2": 705.2,
"r_x3": 308.9,
"r_y3": 705.2,
"coord_origin": "TOPLEFT"
},
"text": "lowing reasons:",
"orig": "lowing reasons:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"
}
],
"headers": [
{
"label": "page_footer",
"id": 16,
"page_no": 10,
"cluster": {
"id": 16,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "11",
"orig": "11",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "11"
}
]
}
},
{
"page_no": 11,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 174.4,
"r_x1": 545.1,
"r_y1": 174.4,
"r_x2": 545.1,
"r_y2": 165.5,
"r_x3": 50.1,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 186.4,
"r_x1": 513.5,
"r_y1": 186.4,
"r_x2": 513.5,
"r_y2": 177.5,
"r_x3": 50.1,
"r_y3": 177.5,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 219.8,
"r_x1": 71.1,
"r_y1": 219.8,
"r_x2": 71.1,
"r_y2": 210.9,
"r_x3": 61.6,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 219.8,
"r_x1": 286.4,
"r_y1": 219.8,
"r_x2": 286.4,
"r_y2": 210.9,
"r_x3": 73.5,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 231.8,
"r_x1": 87.5,
"r_y1": 231.8,
"r_x2": 87.5,
"r_y2": 222.9,
"r_x3": 70.0,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 253.0,
"r_x1": 71.3,
"r_y1": 253.0,
"r_x2": 71.3,
"r_y2": 244.1,
"r_x3": 61.6,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 253.0,
"r_x1": 286.4,
"r_y1": 253.0,
"r_x2": 286.4,
"r_y2": 244.1,
"r_x3": 73.8,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 264.9,
"r_x1": 150.4,
"r_y1": 264.9,
"r_x2": 150.4,
"r_y2": 256.0,
"r_x3": 70.0,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 288.1,
"r_x1": 286.4,
"r_y1": 288.1,
"r_x2": 286.4,
"r_y2": 279.2,
"r_x3": 62.1,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.1,
"r_x1": 286.4,
"r_y1": 300.1,
"r_x2": 286.4,
"r_y2": 291.2,
"r_x3": 50.1,
"r_y3": 291.2,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.0,
"r_x1": 286.4,
"r_y1": 312.0,
"r_x2": 286.4,
"r_y2": 303.1,
"r_x3": 50.1,
"r_y3": 303.1,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.0,
"r_x1": 286.4,
"r_y1": 324.0,
"r_x2": 286.4,
"r_y2": 315.1,
"r_x3": 50.1,
"r_y3": 315.1,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.9,
"r_x1": 286.4,
"r_y1": 335.9,
"r_x2": 286.4,
"r_y2": 327.0,
"r_x3": 50.1,
"r_y3": 327.0,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.9,
"r_x1": 286.4,
"r_y1": 347.9,
"r_x2": 286.4,
"r_y2": 339.0,
"r_x3": 50.1,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.8,
"r_x1": 286.4,
"r_y1": 359.8,
"r_x2": 286.4,
"r_y2": 350.9,
"r_x3": 50.1,
"r_y3": 350.9,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.8,
"r_x1": 286.4,
"r_y1": 371.8,
"r_x2": 286.4,
"r_y2": 362.9,
"r_x3": 50.1,
"r_y3": 362.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.8,
"r_x1": 286.4,
"r_y1": 383.8,
"r_x2": 286.4,
"r_y2": 374.8,
"r_x3": 50.1,
"r_y3": 374.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.7,
"r_x1": 154.6,
"r_y1": 395.7,
"r_x2": 154.6,
"r_y2": 386.8,
"r_x3": 50.1,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 408.0,
"r_x1": 286.4,
"r_y1": 408.0,
"r_x2": 286.4,
"r_y2": 399.1,
"r_x3": 62.1,
"r_y3": 399.1,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.9,
"r_x1": 95.5,
"r_y1": 419.9,
"r_x2": 95.5,
"r_y2": 411.0,
"r_x3": 50.1,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 432.2,
"r_x1": 69.4,
"r_y1": 432.2,
"r_x2": 69.4,
"r_y2": 423.3,
"r_x3": 62.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 432.2,
"r_x1": 286.4,
"r_y1": 432.2,
"r_x2": 286.4,
"r_y2": 423.3,
"r_x3": 71.8,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 286.4,
"r_y1": 444.2,
"r_x2": 286.4,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 456.1,
"r_x1": 274.5,
"r_y1": 456.1,
"r_x2": 274.5,
"r_y2": 447.2,
"r_x3": 50.1,
"r_y3": 447.2,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 468.4,
"r_x1": 69.5,
"r_y1": 468.4,
"r_x2": 69.5,
"r_y2": 459.5,
"r_x3": 62.1,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.4,
"r_y0": 468.4,
"r_x1": 286.4,
"r_y1": 468.4,
"r_x2": 286.4,
"r_y2": 459.5,
"r_x3": 77.4,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 480.3,
"r_x1": 286.4,
"r_y1": 480.3,
"r_x2": 286.4,
"r_y2": 471.4,
"r_x3": 50.1,
"r_y3": 471.4,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.3,
"r_x1": 286.4,
"r_y1": 492.3,
"r_x2": 286.4,
"r_y2": 483.4,
"r_x3": 50.1,
"r_y3": 483.4,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 504.2,
"r_x1": 110.7,
"r_y1": 504.2,
"r_x2": 110.7,
"r_y2": 495.3,
"r_x3": 50.1,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 516.5,
"r_x1": 69.9,
"r_y1": 516.5,
"r_x2": 69.9,
"r_y2": 507.6,
"r_x3": 62.1,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.5,
"r_y0": 516.5,
"r_x1": 286.4,
"r_y1": 516.5,
"r_x2": 286.4,
"r_y2": 507.6,
"r_x3": 72.5,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 528.5,
"r_x1": 226.1,
"r_y1": 528.5,
"r_x2": 226.1,
"r_y2": 519.6,
"r_x3": 50.1,
"r_y3": 519.6,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 540.7,
"r_x1": 286.4,
"r_y1": 540.7,
"r_x2": 286.4,
"r_y2": 531.8,
"r_x3": 62.1,
"r_y3": 531.8,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 552.7,
"r_x1": 286.4,
"r_y1": 552.7,
"r_x2": 286.4,
"r_y2": 543.8,
"r_x3": 50.1,
"r_y3": 543.8,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 564.7,
"r_x1": 114.0,
"r_y1": 564.7,
"r_x2": 114.0,
"r_y2": 555.7,
"r_x3": 50.1,
"r_y3": 555.7,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 576.9,
"r_x1": 69.5,
"r_y1": 576.9,
"r_x2": 69.5,
"r_y2": 568.0,
"r_x3": 62.1,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.7,
"r_y0": 576.9,
"r_x1": 286.4,
"r_y1": 576.9,
"r_x2": 286.4,
"r_y2": 568.0,
"r_x3": 76.7,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 588.9,
"r_x1": 286.4,
"r_y1": 588.9,
"r_x2": 286.4,
"r_y2": 580.0,
"r_x3": 50.1,
"r_y3": 580.0,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 600.8,
"r_x1": 278.7,
"r_y1": 600.8,
"r_x2": 278.7,
"r_y2": 591.9,
"r_x3": 50.1,
"r_y3": 591.9,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.0,
"r_y0": 632.8,
"r_x1": 158.0,
"r_y1": 632.8,
"r_x2": 158.0,
"r_y2": 624.0,
"r_x3": 112.0,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.7,
"r_y0": 632.8,
"r_x1": 203.5,
"r_y1": 632.8,
"r_x2": 203.5,
"r_y2": 624.0,
"r_x3": 160.7,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 640.2,
"r_x1": 189.1,
"r_y1": 640.2,
"r_x2": 189.1,
"r_y2": 634.0,
"r_x3": 185.6,
"r_y3": 634.0,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.8,
"r_x1": 208.5,
"r_y1": 632.8,
"r_x2": 208.5,
"r_y2": 623.4,
"r_x3": 203.5,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.5,
"r_y0": 632.8,
"r_x1": 220.3,
"r_y1": 632.8,
"r_x2": 220.3,
"r_y2": 624.0,
"r_x3": 208.5,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 632.8,
"r_x1": 225.8,
"r_y1": 632.8,
"r_x2": 225.8,
"r_y2": 623.4,
"r_x3": 220.8,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.1,
"r_x1": 122.5,
"r_y1": 654.1,
"r_x2": 122.5,
"r_y2": 645.3,
"r_x3": 110.7,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.8,
"r_y0": 654.1,
"r_x1": 133.5,
"r_y1": 654.1,
"r_x2": 133.5,
"r_y2": 645.3,
"r_x3": 125.8,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.3,
"r_y0": 654.1,
"r_x1": 156.0,
"r_y1": 654.1,
"r_x2": 156.0,
"r_y2": 645.3,
"r_x3": 136.3,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.1,
"r_x1": 161.0,
"r_y1": 654.1,
"r_x2": 161.0,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.0,
"r_y0": 654.1,
"r_x1": 170.2,
"r_y1": 654.1,
"r_x2": 170.2,
"r_y2": 645.3,
"r_x3": 161.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.7,
"r_y0": 654.1,
"r_x1": 185.7,
"r_y1": 654.1,
"r_x2": 185.7,
"r_y2": 644.7,
"r_x3": 170.7,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.9,
"r_y0": 654.1,
"r_x1": 206.1,
"r_y1": 654.1,
"r_x2": 206.1,
"r_y2": 645.3,
"r_x3": 187.9,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 654.1,
"r_x1": 211.0,
"r_y1": 654.1,
"r_x2": 211.0,
"r_y2": 644.7,
"r_x3": 206.1,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.0,
"r_y0": 654.1,
"r_x1": 220.3,
"r_y1": 654.1,
"r_x2": 220.3,
"r_y2": 645.3,
"r_x3": 211.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 654.1,
"r_x1": 225.8,
"r_y1": 654.1,
"r_x2": 225.8,
"r_y2": 644.7,
"r_x3": 220.8,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 643.8,
"r_x1": 286.4,
"r_y1": 643.8,
"r_x2": 286.4,
"r_y2": 634.9,
"r_x3": 274.7,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.0,
"r_x1": 74.5,
"r_y1": 677.0,
"r_x2": 74.5,
"r_y2": 668.1,
"r_x3": 50.1,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.3,
"r_y0": 676.8,
"r_x1": 82.6,
"r_y1": 676.8,
"r_x2": 82.6,
"r_y2": 667.9,
"r_x3": 78.3,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 677.0,
"r_x1": 123.6,
"r_y1": 677.0,
"r_x2": 123.6,
"r_y2": 668.1,
"r_x3": 86.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.5,
"r_y0": 676.8,
"r_x1": 132.5,
"r_y1": 676.8,
"r_x2": 132.5,
"r_y2": 667.3,
"r_x3": 127.5,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 677.0,
"r_x1": 210.7,
"r_y1": 677.0,
"r_x2": 210.7,
"r_y2": 668.1,
"r_x3": 132.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.8,
"r_x1": 215.7,
"r_y1": 676.8,
"r_x2": 215.7,
"r_y2": 667.3,
"r_x3": 210.7,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.6,
"r_y0": 677.0,
"r_x1": 233.9,
"r_y1": 677.0,
"r_x2": 233.9,
"r_y2": 668.1,
"r_x3": 219.6,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.8,
"r_y0": 676.8,
"r_x1": 247.1,
"r_y1": 676.8,
"r_x2": 247.1,
"r_y2": 667.9,
"r_x3": 237.8,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.5,
"r_y0": 677.0,
"r_x1": 286.4,
"r_y1": 677.0,
"r_x2": 286.4,
"r_y2": 668.1,
"r_x3": 251.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 688.9,
"r_x1": 205.9,
"r_y1": 688.9,
"r_x2": 205.9,
"r_y2": 680.0,
"r_x3": 50.1,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 701.2,
"r_x1": 69.5,
"r_y1": 701.2,
"r_x2": 69.5,
"r_y2": 692.3,
"r_x3": 62.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.3,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 76.3,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 94.6,
"r_y1": 713.2,
"r_x2": 94.6,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.9,
"r_x1": 103.3,
"r_y1": 712.9,
"r_x2": 103.3,
"r_y2": 704.1,
"r_x3": 97.6,
"r_y3": 704.1,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.3,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 103.3,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 219.8,
"r_x1": 545.1,
"r_y1": 219.8,
"r_x2": 545.1,
"r_y2": 210.9,
"r_x3": 308.9,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 231.8,
"r_x1": 545.1,
"r_y1": 231.8,
"r_x2": 545.1,
"r_y2": 222.9,
"r_x3": 308.9,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 243.7,
"r_x1": 545.1,
"r_y1": 243.7,
"r_x2": 545.1,
"r_y2": 234.8,
"r_x3": 308.9,
"r_y3": 234.8,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 255.7,
"r_x1": 339.6,
"r_y1": 255.7,
"r_x2": 339.6,
"r_y2": 246.8,
"r_x3": 308.9,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 268.0,
"r_x1": 328.3,
"r_y1": 268.0,
"r_x2": 328.3,
"r_y2": 259.1,
"r_x3": 320.8,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.9,
"r_y0": 268.0,
"r_x1": 545.1,
"r_y1": 268.0,
"r_x2": 545.1,
"r_y2": 259.1,
"r_x3": 334.9,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.0,
"r_x1": 338.2,
"r_y1": 280.0,
"r_x2": 338.2,
"r_y2": 271.1,
"r_x3": 308.9,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.7,
"r_y0": 279.7,
"r_x1": 346.4,
"r_y1": 279.7,
"r_x2": 346.4,
"r_y2": 270.9,
"r_x3": 340.7,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 280.0,
"r_x1": 453.7,
"r_y1": 280.0,
"r_x2": 453.7,
"r_y2": 271.1,
"r_x3": 346.4,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 292.3,
"r_x1": 328.4,
"r_y1": 292.3,
"r_x2": 328.4,
"r_y2": 283.4,
"r_x3": 320.8,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.9,
"r_y0": 292.3,
"r_x1": 545.1,
"r_y1": 292.3,
"r_x2": 545.1,
"r_y2": 283.4,
"r_x3": 330.9,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.2,
"r_x1": 545.1,
"r_y1": 304.2,
"r_x2": 545.1,
"r_y2": 295.3,
"r_x3": 308.9,
"r_y3": 295.3,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.2,
"r_x1": 545.1,
"r_y1": 316.2,
"r_x2": 545.1,
"r_y2": 307.3,
"r_x3": 308.9,
"r_y3": 307.3,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.1,
"r_x1": 545.1,
"r_y1": 328.1,
"r_x2": 545.1,
"r_y2": 319.2,
"r_x3": 308.9,
"r_y3": 319.2,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 340.1,
"r_x1": 397.2,
"r_y1": 340.1,
"r_x2": 397.2,
"r_y2": 331.2,
"r_x3": 308.9,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 340.1,
"r_x1": 545.1,
"r_y1": 340.1,
"r_x2": 545.1,
"r_y2": 331.2,
"r_x3": 403.7,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.0,
"r_x1": 545.1,
"r_y1": 352.0,
"r_x2": 545.1,
"r_y2": 343.1,
"r_x3": 308.9,
"r_y3": 343.1,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.0,
"r_x1": 545.1,
"r_y1": 364.0,
"r_x2": 545.1,
"r_y2": 355.1,
"r_x3": 308.9,
"r_y3": 355.1,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.0,
"r_x1": 545.1,
"r_y1": 376.0,
"r_x2": 545.1,
"r_y2": 367.0,
"r_x3": 308.9,
"r_y3": 367.0,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 387.9,
"r_x1": 329.6,
"r_y1": 387.9,
"r_x2": 329.6,
"r_y2": 379.0,
"r_x3": 308.9,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 400.2,
"r_x1": 328.6,
"r_y1": 400.2,
"r_x2": 328.6,
"r_y2": 391.3,
"r_x3": 320.8,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 331.1,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 426.2,
"r_y1": 460.0,
"r_x2": 426.2,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 472.3,
"r_x1": 328.7,
"r_y1": 472.3,
"r_x2": 328.7,
"r_y2": 463.4,
"r_x3": 320.8,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 331.3,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.3,
"r_x3": 308.9,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.2,
"r_x1": 545.1,
"r_y1": 496.2,
"r_x2": 545.1,
"r_y2": 487.3,
"r_x3": 308.9,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 381.9,
"r_y1": 508.2,
"r_x2": 381.9,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 388.7,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.1,
"r_x1": 545.1,
"r_y1": 520.1,
"r_x2": 545.1,
"r_y2": 511.2,
"r_x3": 308.9,
"r_y3": 511.2,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 532.1,
"r_x1": 545.1,
"r_y1": 532.1,
"r_x2": 545.1,
"r_y2": 523.2,
"r_x3": 308.9,
"r_y3": 523.2,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 544.0,
"r_x1": 545.1,
"r_y1": 544.0,
"r_x2": 545.1,
"r_y2": 535.1,
"r_x3": 308.9,
"r_y3": 535.1,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 556.0,
"r_x1": 545.1,
"r_y1": 556.0,
"r_x2": 545.1,
"r_y2": 547.1,
"r_x3": 308.9,
"r_y3": 547.1,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.9,
"r_x1": 442.2,
"r_y1": 567.9,
"r_x2": 442.2,
"r_y2": 559.0,
"r_x3": 308.9,
"r_y3": 559.0,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 580.2,
"r_x1": 545.1,
"r_y1": 580.2,
"r_x2": 545.1,
"r_y2": 571.3,
"r_x3": 320.8,
"r_y3": 571.3,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 592.2,
"r_x1": 471.6,
"r_y1": 592.2,
"r_x2": 471.6,
"r_y2": 583.3,
"r_x3": 308.9,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 592.0,
"r_x1": 479.7,
"r_y1": 592.0,
"r_x2": 479.7,
"r_y2": 583.1,
"r_x3": 474.8,
"r_y3": 583.1,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.3,
"r_y0": 592.2,
"r_x1": 545.1,
"r_y1": 592.2,
"r_x2": 545.1,
"r_y2": 583.3,
"r_x3": 483.3,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 604.2,
"r_x1": 329.9,
"r_y1": 604.2,
"r_x2": 329.9,
"r_y2": 595.2,
"r_x3": 308.9,
"r_y3": 595.2,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 616.5,
"r_x1": 332.9,
"r_y1": 616.5,
"r_x2": 332.9,
"r_y2": 607.6,
"r_x3": 320.8,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.9,
"r_y0": 616.5,
"r_x1": 545.1,
"r_y1": 616.5,
"r_x2": 545.1,
"r_y2": 607.6,
"r_x3": 339.9,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 628.4,
"r_x1": 495.3,
"r_y1": 628.4,
"r_x2": 495.3,
"r_y2": 619.5,
"r_x3": 308.9,
"r_y3": 619.5,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 640.7,
"r_x1": 545.1,
"r_y1": 640.7,
"r_x2": 545.1,
"r_y2": 631.8,
"r_x3": 320.8,
"r_y3": 631.8,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 652.7,
"r_x1": 455.3,
"r_y1": 652.7,
"r_x2": 455.3,
"r_y2": 643.8,
"r_x3": 308.9,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.8,
"r_y0": 652.5,
"r_x1": 463.5,
"r_y1": 652.5,
"r_x2": 463.5,
"r_y2": 643.6,
"r_x3": 457.8,
"r_y3": 643.6,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 652.7,
"r_x1": 545.1,
"r_y1": 652.7,
"r_x2": 545.1,
"r_y2": 643.8,
"r_x3": 466.0,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 664.6,
"r_x1": 332.4,
"r_y1": 664.6,
"r_x2": 332.4,
"r_y2": 655.7,
"r_x3": 308.9,
"r_y3": 655.7,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 676.9,
"r_x1": 545.1,
"r_y1": 676.9,
"r_x2": 545.1,
"r_y2": 668.0,
"r_x3": 320.8,
"r_y3": 668.0,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 688.9,
"r_x1": 510.6,
"r_y1": 688.9,
"r_x2": 510.6,
"r_y2": 680.0,
"r_x3": 308.9,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 320.8,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 30,
"label": "picture",
"bbox": {
"l": 53.5,
"t": 74.7,
"r": 544.9,
"b": 147.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.4,
"t": 77.3,
"r": 151.9,
"b": 83.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.3,
"t": 75.2,
"r": 59.3,
"b": 81.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.6,
"t": 77.5,
"r": 319.8,
"b": 83.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.4,
"t": 77.3,
"r": 481.8,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.6,
"t": 141.3,
"r": 95.0,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.0,
"t": 101.1,
"r": 85.3,
"b": 106.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.8,
"t": 124.4,
"r": 85.2,
"b": 129.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.6,
"t": 102.5,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 127.0,
"r": 249.7,
"b": 131.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.2,
"t": 114.0,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.4,
"t": 141.3,
"r": 105.1,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.9,
"t": 85.7,
"r": 76.2,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.2,
"r": 107.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.2,
"t": 141.6,
"r": 281.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.7,
"r": 241.9,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.9,
"t": 86.1,
"r": 282.5,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.2,
"t": 141.3,
"r": 444.7,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.4,
"t": 85.7,
"r": 432.7,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.6,
"t": 86.3,
"r": 445.6,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.9,
"t": 141.3,
"r": 136.2,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.9,
"t": 94.8,
"r": 127.1,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.3,
"t": 100.9,
"r": 127.1,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.9,
"t": 107.1,
"r": 127.1,
"b": 112.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.2,
"t": 122.6,
"r": 127.0,
"b": 127.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.9,
"t": 128.7,
"r": 127.0,
"b": 133.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.6,
"t": 141.4,
"r": 156.0,
"b": 146.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.0,
"t": 86.3,
"r": 151.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.7,
"t": 86.6,
"r": 321.7,
"b": 91.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.9,
"t": 141.7,
"r": 310.1,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.2,
"t": 93.1,
"r": 299.4,
"b": 98.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.6,
"t": 99.2,
"r": 299.4,
"b": 104.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.3,
"t": 105.3,
"r": 299.4,
"b": 110.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.4,
"t": 120.4,
"r": 299.2,
"b": 125.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.1,
"t": 126.5,
"r": 299.2,
"b": 131.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.3,
"t": 141.7,
"r": 328.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.6,
"t": 86.7,
"r": 309.6,
"b": 91.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.0,
"t": 141.7,
"r": 483.5,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.0,
"t": 93.8,
"r": 469.2,
"b": 98.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.4,
"t": 99.9,
"r": 469.2,
"b": 104.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.0,
"t": 106.0,
"r": 469.2,
"b": 111.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.4,
"t": 85.6,
"r": 480.7,
"b": 90.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.4,
"t": 141.6,
"r": 182.6,
"b": 146.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.7,
"t": 94.9,
"r": 173.3,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.5,
"t": 101.0,
"r": 173.3,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.3,
"t": 107.1,
"r": 173.3,
"b": 112.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.4,
"t": 107.2,
"r": 346.0,
"b": 112.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.2,
"t": 113.4,
"r": 346.0,
"b": 118.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.9,
"t": 119.5,
"r": 346.0,
"b": 124.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 489.0,
"t": 104.2,
"r": 508.8,
"b": 109.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.2,
"t": 110.3,
"r": 508.8,
"b": 115.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.7,
"t": 116.4,
"r": 508.8,
"b": 121.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.7,
"t": 122.5,
"r": 508.8,
"b": 127.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.4,
"t": 141.7,
"r": 202.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.1,
"r": 197.5,
"b": 91.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.4,
"t": 86.0,
"r": 367.4,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.7,
"t": 141.6,
"r": 374.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.7,
"t": 86.1,
"r": 355.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.5,
"t": 141.4,
"r": 526.0,
"b": 146.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.4,
"t": 86.1,
"r": 523.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 165.5,
"r": 545.1,
"b": 186.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 174.4,
"r_x1": 545.1,
"r_y1": 174.4,
"r_x2": 545.1,
"r_y2": 165.5,
"r_x3": 50.1,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 186.4,
"r_x1": 513.5,
"r_y1": 186.4,
"r_x2": 513.5,
"r_y2": 177.5,
"r_x3": 50.1,
"r_y3": 177.5,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 210.9,
"r": 286.4,
"b": 231.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 219.8,
"r_x1": 71.1,
"r_y1": 219.8,
"r_x2": 71.1,
"r_y2": 210.9,
"r_x3": 61.6,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 219.8,
"r_x1": 286.4,
"r_y1": 219.8,
"r_x2": 286.4,
"r_y2": 210.9,
"r_x3": 73.5,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 231.8,
"r_x1": 87.5,
"r_y1": 231.8,
"r_x2": 87.5,
"r_y2": 222.9,
"r_x3": 70.0,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 244.1,
"r": 286.4,
"b": 264.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 253.0,
"r_x1": 71.3,
"r_y1": 253.0,
"r_x2": 71.3,
"r_y2": 244.1,
"r_x3": 61.6,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 253.0,
"r_x1": 286.4,
"r_y1": 253.0,
"r_x2": 286.4,
"r_y2": 244.1,
"r_x3": 73.8,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 264.9,
"r_x1": 150.4,
"r_y1": 264.9,
"r_x2": 150.4,
"r_y2": 256.0,
"r_x3": 70.0,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 279.2,
"r": 286.4,
"b": 395.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 288.1,
"r_x1": 286.4,
"r_y1": 288.1,
"r_x2": 286.4,
"r_y2": 279.2,
"r_x3": 62.1,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.1,
"r_x1": 286.4,
"r_y1": 300.1,
"r_x2": 286.4,
"r_y2": 291.2,
"r_x3": 50.1,
"r_y3": 291.2,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.0,
"r_x1": 286.4,
"r_y1": 312.0,
"r_x2": 286.4,
"r_y2": 303.1,
"r_x3": 50.1,
"r_y3": 303.1,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.0,
"r_x1": 286.4,
"r_y1": 324.0,
"r_x2": 286.4,
"r_y2": 315.1,
"r_x3": 50.1,
"r_y3": 315.1,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.9,
"r_x1": 286.4,
"r_y1": 335.9,
"r_x2": 286.4,
"r_y2": 327.0,
"r_x3": 50.1,
"r_y3": 327.0,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.9,
"r_x1": 286.4,
"r_y1": 347.9,
"r_x2": 286.4,
"r_y2": 339.0,
"r_x3": 50.1,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.8,
"r_x1": 286.4,
"r_y1": 359.8,
"r_x2": 286.4,
"r_y2": 350.9,
"r_x3": 50.1,
"r_y3": 350.9,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.8,
"r_x1": 286.4,
"r_y1": 371.8,
"r_x2": 286.4,
"r_y2": 362.9,
"r_x3": 50.1,
"r_y3": 362.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.8,
"r_x1": 286.4,
"r_y1": 383.8,
"r_x2": 286.4,
"r_y2": 374.8,
"r_x3": 50.1,
"r_y3": 374.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.7,
"r_x1": 154.6,
"r_y1": 395.7,
"r_x2": 154.6,
"r_y2": 386.8,
"r_x3": 50.1,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 399.1,
"r": 286.4,
"b": 419.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 408.0,
"r_x1": 286.4,
"r_y1": 408.0,
"r_x2": 286.4,
"r_y2": 399.1,
"r_x3": 62.1,
"r_y3": 399.1,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.9,
"r_x1": 95.5,
"r_y1": 419.9,
"r_x2": 95.5,
"r_y2": 411.0,
"r_x3": 50.1,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 423.3,
"r": 286.4,
"b": 456.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 432.2,
"r_x1": 69.4,
"r_y1": 432.2,
"r_x2": 69.4,
"r_y2": 423.3,
"r_x3": 62.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 432.2,
"r_x1": 286.4,
"r_y1": 432.2,
"r_x2": 286.4,
"r_y2": 423.3,
"r_x3": 71.8,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 286.4,
"r_y1": 444.2,
"r_x2": 286.4,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 456.1,
"r_x1": 274.5,
"r_y1": 456.1,
"r_x2": 274.5,
"r_y2": 447.2,
"r_x3": 50.1,
"r_y3": 447.2,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 459.5,
"r": 286.4,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 468.4,
"r_x1": 69.5,
"r_y1": 468.4,
"r_x2": 69.5,
"r_y2": 459.5,
"r_x3": 62.1,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.4,
"r_y0": 468.4,
"r_x1": 286.4,
"r_y1": 468.4,
"r_x2": 286.4,
"r_y2": 459.5,
"r_x3": 77.4,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 480.3,
"r_x1": 286.4,
"r_y1": 480.3,
"r_x2": 286.4,
"r_y2": 471.4,
"r_x3": 50.1,
"r_y3": 471.4,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.3,
"r_x1": 286.4,
"r_y1": 492.3,
"r_x2": 286.4,
"r_y2": 483.4,
"r_x3": 50.1,
"r_y3": 483.4,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 504.2,
"r_x1": 110.7,
"r_y1": 504.2,
"r_x2": 110.7,
"r_y2": 495.3,
"r_x3": 50.1,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 507.6,
"r": 286.4,
"b": 528.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 516.5,
"r_x1": 69.9,
"r_y1": 516.5,
"r_x2": 69.9,
"r_y2": 507.6,
"r_x3": 62.1,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.5,
"r_y0": 516.5,
"r_x1": 286.4,
"r_y1": 516.5,
"r_x2": 286.4,
"r_y2": 507.6,
"r_x3": 72.5,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 528.5,
"r_x1": 226.1,
"r_y1": 528.5,
"r_x2": 226.1,
"r_y2": 519.6,
"r_x3": 50.1,
"r_y3": 519.6,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 531.8,
"r": 286.4,
"b": 564.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 540.7,
"r_x1": 286.4,
"r_y1": 540.7,
"r_x2": 286.4,
"r_y2": 531.8,
"r_x3": 62.1,
"r_y3": 531.8,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 552.7,
"r_x1": 286.4,
"r_y1": 552.7,
"r_x2": 286.4,
"r_y2": 543.8,
"r_x3": 50.1,
"r_y3": 543.8,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 564.7,
"r_x1": 114.0,
"r_y1": 564.7,
"r_x2": 114.0,
"r_y2": 555.7,
"r_x3": 50.1,
"r_y3": 555.7,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 568.0,
"r": 286.4,
"b": 600.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 576.9,
"r_x1": 69.5,
"r_y1": 576.9,
"r_x2": 69.5,
"r_y2": 568.0,
"r_x3": 62.1,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.7,
"r_y0": 576.9,
"r_x1": 286.4,
"r_y1": 576.9,
"r_x2": 286.4,
"r_y2": 568.0,
"r_x3": 76.7,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 588.9,
"r_x1": 286.4,
"r_y1": 588.9,
"r_x2": 286.4,
"r_y2": 580.0,
"r_x3": 50.1,
"r_y3": 580.0,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 600.8,
"r_x1": 278.7,
"r_y1": 600.8,
"r_x2": 278.7,
"r_y2": 591.9,
"r_x3": 50.1,
"r_y3": 591.9,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.4,
"r": 286.4,
"b": 654.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.0,
"r_y0": 632.8,
"r_x1": 158.0,
"r_y1": 632.8,
"r_x2": 158.0,
"r_y2": 624.0,
"r_x3": 112.0,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.7,
"r_y0": 632.8,
"r_x1": 203.5,
"r_y1": 632.8,
"r_x2": 203.5,
"r_y2": 624.0,
"r_x3": 160.7,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 640.2,
"r_x1": 189.1,
"r_y1": 640.2,
"r_x2": 189.1,
"r_y2": 634.0,
"r_x3": 185.6,
"r_y3": 634.0,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.8,
"r_x1": 208.5,
"r_y1": 632.8,
"r_x2": 208.5,
"r_y2": 623.4,
"r_x3": 203.5,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.5,
"r_y0": 632.8,
"r_x1": 220.3,
"r_y1": 632.8,
"r_x2": 220.3,
"r_y2": 624.0,
"r_x3": 208.5,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 632.8,
"r_x1": 225.8,
"r_y1": 632.8,
"r_x2": 225.8,
"r_y2": 623.4,
"r_x3": 220.8,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.1,
"r_x1": 122.5,
"r_y1": 654.1,
"r_x2": 122.5,
"r_y2": 645.3,
"r_x3": 110.7,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.8,
"r_y0": 654.1,
"r_x1": 133.5,
"r_y1": 654.1,
"r_x2": 133.5,
"r_y2": 645.3,
"r_x3": 125.8,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.3,
"r_y0": 654.1,
"r_x1": 156.0,
"r_y1": 654.1,
"r_x2": 156.0,
"r_y2": 645.3,
"r_x3": 136.3,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.1,
"r_x1": 161.0,
"r_y1": 654.1,
"r_x2": 161.0,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.0,
"r_y0": 654.1,
"r_x1": 170.2,
"r_y1": 654.1,
"r_x2": 170.2,
"r_y2": 645.3,
"r_x3": 161.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.7,
"r_y0": 654.1,
"r_x1": 185.7,
"r_y1": 654.1,
"r_x2": 185.7,
"r_y2": 644.7,
"r_x3": 170.7,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.9,
"r_y0": 654.1,
"r_x1": 206.1,
"r_y1": 654.1,
"r_x2": 206.1,
"r_y2": 645.3,
"r_x3": 187.9,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 654.1,
"r_x1": 211.0,
"r_y1": 654.1,
"r_x2": 211.0,
"r_y2": 644.7,
"r_x3": 206.1,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.0,
"r_y0": 654.1,
"r_x1": 220.3,
"r_y1": 654.1,
"r_x2": 220.3,
"r_y2": 645.3,
"r_x3": 211.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 654.1,
"r_x1": 225.8,
"r_y1": 654.1,
"r_x2": 225.8,
"r_y2": 644.7,
"r_x3": 220.8,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 643.8,
"r_x1": 286.4,
"r_y1": 643.8,
"r_x2": 286.4,
"r_y2": 634.9,
"r_x3": 274.7,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 667.3,
"r": 286.4,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.0,
"r_x1": 74.5,
"r_y1": 677.0,
"r_x2": 74.5,
"r_y2": 668.1,
"r_x3": 50.1,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.3,
"r_y0": 676.8,
"r_x1": 82.6,
"r_y1": 676.8,
"r_x2": 82.6,
"r_y2": 667.9,
"r_x3": 78.3,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 677.0,
"r_x1": 123.6,
"r_y1": 677.0,
"r_x2": 123.6,
"r_y2": 668.1,
"r_x3": 86.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.5,
"r_y0": 676.8,
"r_x1": 132.5,
"r_y1": 676.8,
"r_x2": 132.5,
"r_y2": 667.3,
"r_x3": 127.5,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 677.0,
"r_x1": 210.7,
"r_y1": 677.0,
"r_x2": 210.7,
"r_y2": 668.1,
"r_x3": 132.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.8,
"r_x1": 215.7,
"r_y1": 676.8,
"r_x2": 215.7,
"r_y2": 667.3,
"r_x3": 210.7,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.6,
"r_y0": 677.0,
"r_x1": 233.9,
"r_y1": 677.0,
"r_x2": 233.9,
"r_y2": 668.1,
"r_x3": 219.6,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.8,
"r_y0": 676.8,
"r_x1": 247.1,
"r_y1": 676.8,
"r_x2": 247.1,
"r_y2": 667.9,
"r_x3": 237.8,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.5,
"r_y0": 677.0,
"r_x1": 286.4,
"r_y1": 677.0,
"r_x2": 286.4,
"r_y2": 668.1,
"r_x3": 251.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 688.9,
"r_x1": 205.9,
"r_y1": 688.9,
"r_x2": 205.9,
"r_y2": 680.0,
"r_x3": 50.1,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 701.2,
"r_x1": 69.5,
"r_y1": 701.2,
"r_x2": 69.5,
"r_y2": 692.3,
"r_x3": 62.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.3,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 76.3,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 94.6,
"r_y1": 713.2,
"r_x2": 94.6,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.9,
"r_x1": 103.3,
"r_y1": 712.9,
"r_x2": 103.3,
"r_y2": 704.1,
"r_x3": 97.6,
"r_y3": 704.1,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.3,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 103.3,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 16,
"label": "text",
"bbox": {
"l": 308.9,
"t": 210.9,
"r": 545.1,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 219.8,
"r_x1": 545.1,
"r_y1": 219.8,
"r_x2": 545.1,
"r_y2": 210.9,
"r_x3": 308.9,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 231.8,
"r_x1": 545.1,
"r_y1": 231.8,
"r_x2": 545.1,
"r_y2": 222.9,
"r_x3": 308.9,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 243.7,
"r_x1": 545.1,
"r_y1": 243.7,
"r_x2": 545.1,
"r_y2": 234.8,
"r_x3": 308.9,
"r_y3": 234.8,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 255.7,
"r_x1": 339.6,
"r_y1": 255.7,
"r_x2": 339.6,
"r_y2": 246.8,
"r_x3": 308.9,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 259.1,
"r": 545.1,
"b": 280.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 268.0,
"r_x1": 328.3,
"r_y1": 268.0,
"r_x2": 328.3,
"r_y2": 259.1,
"r_x3": 320.8,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.9,
"r_y0": 268.0,
"r_x1": 545.1,
"r_y1": 268.0,
"r_x2": 545.1,
"r_y2": 259.1,
"r_x3": 334.9,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.0,
"r_x1": 338.2,
"r_y1": 280.0,
"r_x2": 338.2,
"r_y2": 271.1,
"r_x3": 308.9,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.7,
"r_y0": 279.7,
"r_x1": 346.4,
"r_y1": 279.7,
"r_x2": 346.4,
"r_y2": 270.9,
"r_x3": 340.7,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 280.0,
"r_x1": 453.7,
"r_y1": 280.0,
"r_x2": 453.7,
"r_y2": 271.1,
"r_x3": 346.4,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 283.4,
"r": 545.1,
"b": 387.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 292.3,
"r_x1": 328.4,
"r_y1": 292.3,
"r_x2": 328.4,
"r_y2": 283.4,
"r_x3": 320.8,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.9,
"r_y0": 292.3,
"r_x1": 545.1,
"r_y1": 292.3,
"r_x2": 545.1,
"r_y2": 283.4,
"r_x3": 330.9,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.2,
"r_x1": 545.1,
"r_y1": 304.2,
"r_x2": 545.1,
"r_y2": 295.3,
"r_x3": 308.9,
"r_y3": 295.3,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.2,
"r_x1": 545.1,
"r_y1": 316.2,
"r_x2": 545.1,
"r_y2": 307.3,
"r_x3": 308.9,
"r_y3": 307.3,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.1,
"r_x1": 545.1,
"r_y1": 328.1,
"r_x2": 545.1,
"r_y2": 319.2,
"r_x3": 308.9,
"r_y3": 319.2,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 340.1,
"r_x1": 397.2,
"r_y1": 340.1,
"r_x2": 397.2,
"r_y2": 331.2,
"r_x3": 308.9,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 340.1,
"r_x1": 545.1,
"r_y1": 340.1,
"r_x2": 545.1,
"r_y2": 331.2,
"r_x3": 403.7,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.0,
"r_x1": 545.1,
"r_y1": 352.0,
"r_x2": 545.1,
"r_y2": 343.1,
"r_x3": 308.9,
"r_y3": 343.1,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.0,
"r_x1": 545.1,
"r_y1": 364.0,
"r_x2": 545.1,
"r_y2": 355.1,
"r_x3": 308.9,
"r_y3": 355.1,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.0,
"r_x1": 545.1,
"r_y1": 376.0,
"r_x2": 545.1,
"r_y2": 367.0,
"r_x3": 308.9,
"r_y3": 367.0,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 387.9,
"r_x1": 329.6,
"r_y1": 387.9,
"r_x2": 329.6,
"r_y2": 379.0,
"r_x3": 308.9,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 391.3,
"r": 545.1,
"b": 460.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 400.2,
"r_x1": 328.6,
"r_y1": 400.2,
"r_x2": 328.6,
"r_y2": 391.3,
"r_x3": 320.8,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 331.1,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 426.2,
"r_y1": 460.0,
"r_x2": 426.2,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 463.4,
"r": 545.1,
"b": 567.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 472.3,
"r_x1": 328.7,
"r_y1": 472.3,
"r_x2": 328.7,
"r_y2": 463.4,
"r_x3": 320.8,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 331.3,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.3,
"r_x3": 308.9,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.2,
"r_x1": 545.1,
"r_y1": 496.2,
"r_x2": 545.1,
"r_y2": 487.3,
"r_x3": 308.9,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 381.9,
"r_y1": 508.2,
"r_x2": 381.9,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 388.7,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.1,
"r_x1": 545.1,
"r_y1": 520.1,
"r_x2": 545.1,
"r_y2": 511.2,
"r_x3": 308.9,
"r_y3": 511.2,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 532.1,
"r_x1": 545.1,
"r_y1": 532.1,
"r_x2": 545.1,
"r_y2": 523.2,
"r_x3": 308.9,
"r_y3": 523.2,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 544.0,
"r_x1": 545.1,
"r_y1": 544.0,
"r_x2": 545.1,
"r_y2": 535.1,
"r_x3": 308.9,
"r_y3": 535.1,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 556.0,
"r_x1": 545.1,
"r_y1": 556.0,
"r_x2": 545.1,
"r_y2": 547.1,
"r_x3": 308.9,
"r_y3": 547.1,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.9,
"r_x1": 442.2,
"r_y1": 567.9,
"r_x2": 442.2,
"r_y2": 559.0,
"r_x3": 308.9,
"r_y3": 559.0,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 19,
"label": "text",
"bbox": {
"l": 308.9,
"t": 571.3,
"r": 545.1,
"b": 604.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 580.2,
"r_x1": 545.1,
"r_y1": 580.2,
"r_x2": 545.1,
"r_y2": 571.3,
"r_x3": 320.8,
"r_y3": 571.3,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 592.2,
"r_x1": 471.6,
"r_y1": 592.2,
"r_x2": 471.6,
"r_y2": 583.3,
"r_x3": 308.9,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 592.0,
"r_x1": 479.7,
"r_y1": 592.0,
"r_x2": 479.7,
"r_y2": 583.1,
"r_x3": 474.8,
"r_y3": 583.1,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.3,
"r_y0": 592.2,
"r_x1": 545.1,
"r_y1": 592.2,
"r_x2": 545.1,
"r_y2": 583.3,
"r_x3": 483.3,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 604.2,
"r_x1": 329.9,
"r_y1": 604.2,
"r_x2": 329.9,
"r_y2": 595.2,
"r_x3": 308.9,
"r_y3": 595.2,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 607.6,
"r": 545.1,
"b": 628.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 616.5,
"r_x1": 332.9,
"r_y1": 616.5,
"r_x2": 332.9,
"r_y2": 607.6,
"r_x3": 320.8,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.9,
"r_y0": 616.5,
"r_x1": 545.1,
"r_y1": 616.5,
"r_x2": 545.1,
"r_y2": 607.6,
"r_x3": 339.9,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 628.4,
"r_x1": 495.3,
"r_y1": 628.4,
"r_x2": 495.3,
"r_y2": 619.5,
"r_x3": 308.9,
"r_y3": 619.5,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 631.8,
"r": 545.1,
"b": 664.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 640.7,
"r_x1": 545.1,
"r_y1": 640.7,
"r_x2": 545.1,
"r_y2": 631.8,
"r_x3": 320.8,
"r_y3": 631.8,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 652.7,
"r_x1": 455.3,
"r_y1": 652.7,
"r_x2": 455.3,
"r_y2": 643.8,
"r_x3": 308.9,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.8,
"r_y0": 652.5,
"r_x1": 463.5,
"r_y1": 652.5,
"r_x2": 463.5,
"r_y2": 643.6,
"r_x3": 457.8,
"r_y3": 643.6,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 652.7,
"r_x1": 545.1,
"r_y1": 652.7,
"r_x2": 545.1,
"r_y2": 643.8,
"r_x3": 466.0,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 664.6,
"r_x1": 332.4,
"r_y1": 664.6,
"r_x2": 332.4,
"r_y2": 655.7,
"r_x3": 308.9,
"r_y3": 655.7,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 668.0,
"r": 545.1,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 676.9,
"r_x1": 545.1,
"r_y1": 676.9,
"r_x2": 545.1,
"r_y2": 668.0,
"r_x3": 320.8,
"r_y3": 668.0,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 688.9,
"r_x1": 510.6,
"r_y1": 688.9,
"r_x2": 510.6,
"r_y2": 680.0,
"r_x3": 308.9,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 692.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 320.8,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "picture",
"id": 30,
"page_no": 11,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 53.5,
"t": 74.7,
"r": 544.9,
"b": 147.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.4,
"t": 77.3,
"r": 151.9,
"b": 83.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.3,
"t": 75.2,
"r": 59.3,
"b": 81.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.6,
"t": 77.5,
"r": 319.8,
"b": 83.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.4,
"t": 77.3,
"r": 481.8,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.6,
"t": 141.3,
"r": 95.0,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.0,
"t": 101.1,
"r": 85.3,
"b": 106.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.8,
"t": 124.4,
"r": 85.2,
"b": 129.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.6,
"t": 102.5,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 127.0,
"r": 249.7,
"b": 131.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.2,
"t": 114.0,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.4,
"t": 141.3,
"r": 105.1,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.9,
"t": 85.7,
"r": 76.2,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.2,
"r": 107.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.2,
"t": 141.6,
"r": 281.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.7,
"r": 241.9,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.9,
"t": 86.1,
"r": 282.5,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.2,
"t": 141.3,
"r": 444.7,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.4,
"t": 85.7,
"r": 432.7,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.6,
"t": 86.3,
"r": 445.6,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.9,
"t": 141.3,
"r": 136.2,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.9,
"t": 94.8,
"r": 127.1,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.3,
"t": 100.9,
"r": 127.1,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.9,
"t": 107.1,
"r": 127.1,
"b": 112.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.2,
"t": 122.6,
"r": 127.0,
"b": 127.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.9,
"t": 128.7,
"r": 127.0,
"b": 133.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.6,
"t": 141.4,
"r": 156.0,
"b": 146.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.0,
"t": 86.3,
"r": 151.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.7,
"t": 86.6,
"r": 321.7,
"b": 91.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.9,
"t": 141.7,
"r": 310.1,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.2,
"t": 93.1,
"r": 299.4,
"b": 98.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.6,
"t": 99.2,
"r": 299.4,
"b": 104.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.3,
"t": 105.3,
"r": 299.4,
"b": 110.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.4,
"t": 120.4,
"r": 299.2,
"b": 125.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.1,
"t": 126.5,
"r": 299.2,
"b": 131.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.3,
"t": 141.7,
"r": 328.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.6,
"t": 86.7,
"r": 309.6,
"b": 91.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.0,
"t": 141.7,
"r": 483.5,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.0,
"t": 93.8,
"r": 469.2,
"b": 98.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.4,
"t": 99.9,
"r": 469.2,
"b": 104.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.0,
"t": 106.0,
"r": 469.2,
"b": 111.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.4,
"t": 85.6,
"r": 480.7,
"b": 90.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.4,
"t": 141.6,
"r": 182.6,
"b": 146.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.7,
"t": 94.9,
"r": 173.3,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.5,
"t": 101.0,
"r": 173.3,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.3,
"t": 107.1,
"r": 173.3,
"b": 112.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.4,
"t": 107.2,
"r": 346.0,
"b": 112.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.2,
"t": 113.4,
"r": 346.0,
"b": 118.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.9,
"t": 119.5,
"r": 346.0,
"b": 124.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 489.0,
"t": 104.2,
"r": 508.8,
"b": 109.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.2,
"t": 110.3,
"r": 508.8,
"b": 115.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.7,
"t": 116.4,
"r": 508.8,
"b": 121.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.7,
"t": 122.5,
"r": 508.8,
"b": 127.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.4,
"t": 141.7,
"r": 202.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.1,
"r": 197.5,
"b": 91.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.4,
"t": 86.0,
"r": 367.4,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.7,
"t": 141.6,
"r": 374.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.7,
"t": 86.1,
"r": 355.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.5,
"t": 141.4,
"r": 526.0,
"b": 146.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.4,
"t": 86.1,
"r": 523.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 1,
"page_no": 11,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 165.5,
"r": 545.1,
"b": 186.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 174.4,
"r_x1": 545.1,
"r_y1": 174.4,
"r_x2": 545.1,
"r_y2": 165.5,
"r_x3": 50.1,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 186.4,
"r_x1": 513.5,
"r_y1": 186.4,
"r_x2": 513.5,
"r_y2": 177.5,
"r_x3": 50.1,
"r_y3": 177.5,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."
},
{
"label": "list_item",
"id": 4,
"page_no": 11,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 210.9,
"r": 286.4,
"b": 231.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 219.8,
"r_x1": 71.1,
"r_y1": 219.8,
"r_x2": 71.1,
"r_y2": 210.9,
"r_x3": 61.6,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 219.8,
"r_x1": 286.4,
"r_y1": 219.8,
"r_x2": 286.4,
"r_y2": 210.9,
"r_x3": 73.5,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 231.8,
"r_x1": 87.5,
"r_y1": 231.8,
"r_x2": 87.5,
"r_y2": 222.9,
"r_x3": 70.0,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 TableFormer output does not include the table cell content."
},
{
"label": "list_item",
"id": 3,
"page_no": 11,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 244.1,
"r": 286.4,
"b": 264.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 253.0,
"r_x1": 71.3,
"r_y1": 253.0,
"r_x2": 71.3,
"r_y2": 244.1,
"r_x3": 61.6,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 253.0,
"r_x1": 286.4,
"r_y1": 253.0,
"r_x2": 286.4,
"r_y2": 244.1,
"r_x3": 73.8,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 264.9,
"r_x1": 150.4,
"r_y1": 264.9,
"r_x2": 150.4,
"r_y2": 256.0,
"r_x3": 70.0,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."
},
{
"label": "text",
"id": 0,
"page_no": 11,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 279.2,
"r": 286.4,
"b": 395.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 288.1,
"r_x1": 286.4,
"r_y1": 288.1,
"r_x2": 286.4,
"r_y2": 279.2,
"r_x3": 62.1,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.1,
"r_x1": 286.4,
"r_y1": 300.1,
"r_x2": 286.4,
"r_y2": 291.2,
"r_x3": 50.1,
"r_y3": 291.2,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.0,
"r_x1": 286.4,
"r_y1": 312.0,
"r_x2": 286.4,
"r_y2": 303.1,
"r_x3": 50.1,
"r_y3": 303.1,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.0,
"r_x1": 286.4,
"r_y1": 324.0,
"r_x2": 286.4,
"r_y2": 315.1,
"r_x3": 50.1,
"r_y3": 315.1,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.9,
"r_x1": 286.4,
"r_y1": 335.9,
"r_x2": 286.4,
"r_y2": 327.0,
"r_x3": 50.1,
"r_y3": 327.0,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.9,
"r_x1": 286.4,
"r_y1": 347.9,
"r_x2": 286.4,
"r_y2": 339.0,
"r_x3": 50.1,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.8,
"r_x1": 286.4,
"r_y1": 359.8,
"r_x2": 286.4,
"r_y2": 350.9,
"r_x3": 50.1,
"r_y3": 350.9,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.8,
"r_x1": 286.4,
"r_y1": 371.8,
"r_x2": 286.4,
"r_y2": 362.9,
"r_x3": 50.1,
"r_y3": 362.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.8,
"r_x1": 286.4,
"r_y1": 383.8,
"r_x2": 286.4,
"r_y2": 374.8,
"r_x3": 50.1,
"r_y3": 374.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.7,
"r_x1": 154.6,
"r_y1": 395.7,
"r_x2": 154.6,
"r_y2": 386.8,
"r_x3": 50.1,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."
},
{
"label": "text",
"id": 11,
"page_no": 11,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 399.1,
"r": 286.4,
"b": 419.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 408.0,
"r_x1": 286.4,
"r_y1": 408.0,
"r_x2": 286.4,
"r_y2": 399.1,
"r_x3": 62.1,
"r_y3": 399.1,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.9,
"r_x1": 95.5,
"r_y1": 419.9,
"r_x2": 95.5,
"r_y2": 411.0,
"r_x3": 50.1,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Here is a step-by-step description of the prediction postprocessing:"
},
{
"label": "list_item",
"id": 20,
"page_no": 11,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 423.3,
"r": 286.4,
"b": 456.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 432.2,
"r_x1": 69.4,
"r_y1": 432.2,
"r_x2": 69.4,
"r_y2": 423.3,
"r_x3": 62.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 432.2,
"r_x1": 286.4,
"r_y1": 432.2,
"r_x2": 286.4,
"r_y2": 423.3,
"r_x3": 71.8,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 286.4,
"r_y1": 444.2,
"r_x2": 286.4,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 456.1,
"r_x1": 274.5,
"r_y1": 456.1,
"r_x2": 274.5,
"r_y2": 447.2,
"r_x3": 50.1,
"r_y3": 447.2,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."
},
{
"label": "list_item",
"id": 2,
"page_no": 11,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 459.5,
"r": 286.4,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 468.4,
"r_x1": 69.5,
"r_y1": 468.4,
"r_x2": 69.5,
"r_y2": 459.5,
"r_x3": 62.1,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.4,
"r_y0": 468.4,
"r_x1": 286.4,
"r_y1": 468.4,
"r_x2": 286.4,
"r_y2": 459.5,
"r_x3": 77.4,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 480.3,
"r_x1": 286.4,
"r_y1": 480.3,
"r_x2": 286.4,
"r_y2": 471.4,
"r_x3": 50.1,
"r_y3": 471.4,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.3,
"r_x1": 286.4,
"r_y1": 492.3,
"r_x2": 286.4,
"r_y2": 483.4,
"r_x3": 50.1,
"r_y3": 483.4,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 504.2,
"r_x1": 110.7,
"r_y1": 504.2,
"r_x2": 110.7,
"r_y2": 495.3,
"r_x3": 50.1,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."
},
{
"label": "list_item",
"id": 10,
"page_no": 11,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 507.6,
"r": 286.4,
"b": 528.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 516.5,
"r_x1": 69.9,
"r_y1": 516.5,
"r_x2": 69.9,
"r_y2": 507.6,
"r_x3": 62.1,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.5,
"r_y0": 516.5,
"r_x1": 286.4,
"r_y1": 516.5,
"r_x2": 286.4,
"r_y2": 507.6,
"r_x3": 72.5,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 528.5,
"r_x1": 226.1,
"r_y1": 528.5,
"r_x2": 226.1,
"r_y2": 519.6,
"r_x3": 50.1,
"r_y3": 519.6,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones."
},
{
"label": "list_item",
"id": 8,
"page_no": 11,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 531.8,
"r": 286.4,
"b": 564.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 540.7,
"r_x1": 286.4,
"r_y1": 540.7,
"r_x2": 286.4,
"r_y2": 531.8,
"r_x3": 62.1,
"r_y3": 531.8,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 552.7,
"r_x1": 286.4,
"r_y1": 552.7,
"r_x2": 286.4,
"r_y2": 543.8,
"r_x3": 50.1,
"r_y3": 543.8,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 564.7,
"r_x1": 114.0,
"r_y1": 564.7,
"r_x2": 114.0,
"r_y2": 555.7,
"r_x3": 50.1,
"r_y3": 555.7,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."
},
{
"label": "list_item",
"id": 5,
"page_no": 11,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 568.0,
"r": 286.4,
"b": 600.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 576.9,
"r_x1": 69.5,
"r_y1": 576.9,
"r_x2": 69.5,
"r_y2": 568.0,
"r_x3": 62.1,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.7,
"r_y0": 576.9,
"r_x1": 286.4,
"r_y1": 576.9,
"r_x2": 286.4,
"r_y2": 568.0,
"r_x3": 76.7,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 588.9,
"r_x1": 286.4,
"r_y1": 588.9,
"r_x2": 286.4,
"r_y2": 580.0,
"r_x3": 50.1,
"r_y3": 580.0,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 600.8,
"r_x1": 278.7,
"r_y1": 600.8,
"r_x2": 278.7,
"r_y2": 591.9,
"r_x3": 50.1,
"r_y3": 591.9,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"
},
{
"label": "formula",
"id": 12,
"page_no": 11,
"cluster": {
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.4,
"r": 286.4,
"b": 654.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.0,
"r_y0": 632.8,
"r_x1": 158.0,
"r_y1": 632.8,
"r_x2": 158.0,
"r_y2": 624.0,
"r_x3": 112.0,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.7,
"r_y0": 632.8,
"r_x1": 203.5,
"r_y1": 632.8,
"r_x2": 203.5,
"r_y2": 624.0,
"r_x3": 160.7,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 640.2,
"r_x1": 189.1,
"r_y1": 640.2,
"r_x2": 189.1,
"r_y2": 634.0,
"r_x3": 185.6,
"r_y3": 634.0,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.8,
"r_x1": 208.5,
"r_y1": 632.8,
"r_x2": 208.5,
"r_y2": 623.4,
"r_x3": 203.5,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.5,
"r_y0": 632.8,
"r_x1": 220.3,
"r_y1": 632.8,
"r_x2": 220.3,
"r_y2": 624.0,
"r_x3": 208.5,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 632.8,
"r_x1": 225.8,
"r_y1": 632.8,
"r_x2": 225.8,
"r_y2": 623.4,
"r_x3": 220.8,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.1,
"r_x1": 122.5,
"r_y1": 654.1,
"r_x2": 122.5,
"r_y2": 645.3,
"r_x3": 110.7,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.8,
"r_y0": 654.1,
"r_x1": 133.5,
"r_y1": 654.1,
"r_x2": 133.5,
"r_y2": 645.3,
"r_x3": 125.8,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.3,
"r_y0": 654.1,
"r_x1": 156.0,
"r_y1": 654.1,
"r_x2": 156.0,
"r_y2": 645.3,
"r_x3": 136.3,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.1,
"r_x1": 161.0,
"r_y1": 654.1,
"r_x2": 161.0,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.0,
"r_y0": 654.1,
"r_x1": 170.2,
"r_y1": 654.1,
"r_x2": 170.2,
"r_y2": 645.3,
"r_x3": 161.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.7,
"r_y0": 654.1,
"r_x1": 185.7,
"r_y1": 654.1,
"r_x2": 185.7,
"r_y2": 644.7,
"r_x3": 170.7,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.9,
"r_y0": 654.1,
"r_x1": 206.1,
"r_y1": 654.1,
"r_x2": 206.1,
"r_y2": 645.3,
"r_x3": 187.9,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 654.1,
"r_x1": 211.0,
"r_y1": 654.1,
"r_x2": 211.0,
"r_y2": 644.7,
"r_x3": 206.1,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.0,
"r_y0": 654.1,
"r_x1": 220.3,
"r_y1": 654.1,
"r_x2": 220.3,
"r_y2": 645.3,
"r_x3": 211.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 654.1,
"r_x1": 225.8,
"r_y1": 654.1,
"r_x2": 225.8,
"r_y2": 644.7,
"r_x3": 220.8,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 643.8,
"r_x1": 286.4,
"r_y1": 643.8,
"r_x2": 286.4,
"r_y2": 634.9,
"r_x3": 274.7,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "alignment = arg min$_{c}$ { D$_{c}$ }, D$_{c}$ = max { x$_{c}$ } \u2212 min { x$_{c}$ } (4)"
},
{
"label": "text",
"id": 7,
"page_no": 11,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 667.3,
"r": 286.4,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.0,
"r_x1": 74.5,
"r_y1": 677.0,
"r_x2": 74.5,
"r_y2": 668.1,
"r_x3": 50.1,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.3,
"r_y0": 676.8,
"r_x1": 82.6,
"r_y1": 676.8,
"r_x2": 82.6,
"r_y2": 667.9,
"r_x3": 78.3,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 677.0,
"r_x1": 123.6,
"r_y1": 677.0,
"r_x2": 123.6,
"r_y2": 668.1,
"r_x3": 86.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.5,
"r_y0": 676.8,
"r_x1": 132.5,
"r_y1": 676.8,
"r_x2": 132.5,
"r_y2": 667.3,
"r_x3": 127.5,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 677.0,
"r_x1": 210.7,
"r_y1": 677.0,
"r_x2": 210.7,
"r_y2": 668.1,
"r_x3": 132.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.8,
"r_x1": 215.7,
"r_y1": 676.8,
"r_x2": 215.7,
"r_y2": 667.3,
"r_x3": 210.7,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.6,
"r_y0": 677.0,
"r_x1": 233.9,
"r_y1": 677.0,
"r_x2": 233.9,
"r_y2": 668.1,
"r_x3": 219.6,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.8,
"r_y0": 676.8,
"r_x1": 247.1,
"r_y1": 676.8,
"r_x2": 247.1,
"r_y2": 667.9,
"r_x3": 237.8,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.5,
"r_y0": 677.0,
"r_x1": 286.4,
"r_y1": 677.0,
"r_x2": 286.4,
"r_y2": 668.1,
"r_x3": 251.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 688.9,
"r_x1": 205.9,
"r_y1": 688.9,
"r_x2": 205.9,
"r_y2": 680.0,
"r_x3": 50.1,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where c is one of { left, centroid, right } and x$_{c}$ is the x-coordinate for the corresponding point."
},
{
"label": "list_item",
"id": 13,
"page_no": 11,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 701.2,
"r_x1": 69.5,
"r_y1": 701.2,
"r_x2": 69.5,
"r_y2": 692.3,
"r_x3": 62.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.3,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 76.3,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 94.6,
"r_y1": 713.2,
"r_x2": 94.6,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.9,
"r_x1": 103.3,
"r_y1": 712.9,
"r_x2": 103.3,
"r_y2": 704.1,
"r_x3": 97.6,
"r_y3": 704.1,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.3,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 103.3,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Use the alignment computed in step 4, to compute the median x-coordinate for all table columns and the me-"
},
{
"label": "text",
"id": 16,
"page_no": 11,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 308.9,
"t": 210.9,
"r": 545.1,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 219.8,
"r_x1": 545.1,
"r_y1": 219.8,
"r_x2": 545.1,
"r_y2": 210.9,
"r_x3": 308.9,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 231.8,
"r_x1": 545.1,
"r_y1": 231.8,
"r_x2": 545.1,
"r_y2": 222.9,
"r_x3": 308.9,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 243.7,
"r_x1": 545.1,
"r_y1": 243.7,
"r_x2": 545.1,
"r_y2": 234.8,
"r_x3": 308.9,
"r_y3": 234.8,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 255.7,
"r_x1": 339.6,
"r_y1": 255.7,
"r_x2": 339.6,
"r_y2": 246.8,
"r_x3": 308.9,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."
},
{
"label": "list_item",
"id": 9,
"page_no": 11,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 259.1,
"r": 545.1,
"b": 280.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 268.0,
"r_x1": 328.3,
"r_y1": 268.0,
"r_x2": 328.3,
"r_y2": 259.1,
"r_x3": 320.8,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.9,
"r_y0": 268.0,
"r_x1": 545.1,
"r_y1": 268.0,
"r_x2": 545.1,
"r_y2": 259.1,
"r_x3": 334.9,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.0,
"r_x1": 338.2,
"r_y1": 280.0,
"r_x2": 338.2,
"r_y2": 271.1,
"r_x3": 308.9,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.7,
"r_y0": 279.7,
"r_x1": 346.4,
"r_y1": 279.7,
"r_x2": 346.4,
"r_y2": 270.9,
"r_x3": 340.7,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 280.0,
"r_x1": 453.7,
"r_y1": 280.0,
"r_x2": 453.7,
"r_y2": 271.1,
"r_x3": 346.4,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes."
},
{
"label": "list_item",
"id": 6,
"page_no": 11,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 283.4,
"r": 545.1,
"b": 387.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 292.3,
"r_x1": 328.4,
"r_y1": 292.3,
"r_x2": 328.4,
"r_y2": 283.4,
"r_x3": 320.8,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.9,
"r_y0": 292.3,
"r_x1": 545.1,
"r_y1": 292.3,
"r_x2": 545.1,
"r_y2": 283.4,
"r_x3": 330.9,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.2,
"r_x1": 545.1,
"r_y1": 304.2,
"r_x2": 545.1,
"r_y2": 295.3,
"r_x3": 308.9,
"r_y3": 295.3,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.2,
"r_x1": 545.1,
"r_y1": 316.2,
"r_x2": 545.1,
"r_y2": 307.3,
"r_x3": 308.9,
"r_y3": 307.3,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.1,
"r_x1": 545.1,
"r_y1": 328.1,
"r_x2": 545.1,
"r_y2": 319.2,
"r_x3": 308.9,
"r_y3": 319.2,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 340.1,
"r_x1": 397.2,
"r_y1": 340.1,
"r_x2": 397.2,
"r_y2": 331.2,
"r_x3": 308.9,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 340.1,
"r_x1": 545.1,
"r_y1": 340.1,
"r_x2": 545.1,
"r_y2": 331.2,
"r_x3": 403.7,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.0,
"r_x1": 545.1,
"r_y1": 352.0,
"r_x2": 545.1,
"r_y2": 343.1,
"r_x3": 308.9,
"r_y3": 343.1,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.0,
"r_x1": 545.1,
"r_y1": 364.0,
"r_x2": 545.1,
"r_y2": 355.1,
"r_x3": 308.9,
"r_y3": 355.1,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.0,
"r_x1": 545.1,
"r_y1": 376.0,
"r_x2": 545.1,
"r_y2": 367.0,
"r_x3": 308.9,
"r_y3": 367.0,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 387.9,
"r_x1": 329.6,
"r_y1": 387.9,
"r_x2": 329.6,
"r_y2": 379.0,
"r_x3": 308.9,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."
},
{
"label": "list_item",
"id": 17,
"page_no": 11,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 391.3,
"r": 545.1,
"b": 460.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 400.2,
"r_x1": 328.6,
"r_y1": 400.2,
"r_x2": 328.6,
"r_y2": 391.3,
"r_x3": 320.8,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 331.1,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 426.2,
"r_y1": 460.0,
"r_x2": 426.2,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."
},
{
"label": "list_item",
"id": 15,
"page_no": 11,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 463.4,
"r": 545.1,
"b": 567.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 472.3,
"r_x1": 328.7,
"r_y1": 472.3,
"r_x2": 328.7,
"r_y2": 463.4,
"r_x3": 320.8,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 331.3,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.3,
"r_x3": 308.9,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.2,
"r_x1": 545.1,
"r_y1": 496.2,
"r_x2": 545.1,
"r_y2": 487.3,
"r_x3": 308.9,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 381.9,
"r_y1": 508.2,
"r_x2": 381.9,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 388.7,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.1,
"r_x1": 545.1,
"r_y1": 520.1,
"r_x2": 545.1,
"r_y2": 511.2,
"r_x3": 308.9,
"r_y3": 511.2,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 532.1,
"r_x1": 545.1,
"r_y1": 532.1,
"r_x2": 545.1,
"r_y2": 523.2,
"r_x3": 308.9,
"r_y3": 523.2,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 544.0,
"r_x1": 545.1,
"r_y1": 544.0,
"r_x2": 545.1,
"r_y2": 535.1,
"r_x3": 308.9,
"r_y3": 535.1,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 556.0,
"r_x1": 545.1,
"r_y1": 556.0,
"r_x2": 545.1,
"r_y2": 547.1,
"r_x3": 308.9,
"r_y3": 547.1,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.9,
"r_x1": 442.2,
"r_y1": 567.9,
"r_x2": 442.2,
"r_y2": 559.0,
"r_x3": 308.9,
"r_y3": 559.0,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."
},
{
"label": "text",
"id": 19,
"page_no": 11,
"cluster": {
"id": 19,
"label": "text",
"bbox": {
"l": 308.9,
"t": 571.3,
"r": 545.1,
"b": 604.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 580.2,
"r_x1": 545.1,
"r_y1": 580.2,
"r_x2": 545.1,
"r_y2": 571.3,
"r_x3": 320.8,
"r_y3": 571.3,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 592.2,
"r_x1": 471.6,
"r_y1": 592.2,
"r_x2": 471.6,
"r_y2": 583.3,
"r_x3": 308.9,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 592.0,
"r_x1": 479.7,
"r_y1": 592.0,
"r_x2": 479.7,
"r_y2": 583.1,
"r_x3": 474.8,
"r_y3": 583.1,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.3,
"r_y0": 592.2,
"r_x1": 545.1,
"r_y1": 592.2,
"r_x2": 545.1,
"r_y2": 583.3,
"r_x3": 483.3,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 604.2,
"r_x1": 329.9,
"r_y1": 604.2,
"r_x2": 329.9,
"r_y2": 595.2,
"r_x3": 308.9,
"r_y3": 595.2,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."
},
{
"label": "list_item",
"id": 21,
"page_no": 11,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 607.6,
"r": 545.1,
"b": 628.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 616.5,
"r_x1": 332.9,
"r_y1": 616.5,
"r_x2": 332.9,
"r_y2": 607.6,
"r_x3": 320.8,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.9,
"r_y0": 616.5,
"r_x1": 545.1,
"r_y1": 616.5,
"r_x2": 545.1,
"r_y2": 607.6,
"r_x3": 339.9,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 628.4,
"r_x1": 495.3,
"r_y1": 628.4,
"r_x2": 495.3,
"r_y2": 619.5,
"r_x3": 308.9,
"r_y3": 619.5,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."
},
{
"label": "list_item",
"id": 18,
"page_no": 11,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 631.8,
"r": 545.1,
"b": 664.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 640.7,
"r_x1": 545.1,
"r_y1": 640.7,
"r_x2": 545.1,
"r_y2": 631.8,
"r_x3": 320.8,
"r_y3": 631.8,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 652.7,
"r_x1": 455.3,
"r_y1": 652.7,
"r_x2": 455.3,
"r_y2": 643.8,
"r_x3": 308.9,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.8,
"r_y0": 652.5,
"r_x1": 463.5,
"r_y1": 652.5,
"r_x2": 463.5,
"r_y2": 643.6,
"r_x3": 457.8,
"r_y3": 643.6,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 652.7,
"r_x1": 545.1,
"r_y1": 652.7,
"r_x2": 545.1,
"r_y2": 643.8,
"r_x3": 466.0,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 664.6,
"r_x1": 332.4,
"r_y1": 664.6,
"r_x2": 332.4,
"r_y2": 655.7,
"r_x3": 308.9,
"r_y3": 655.7,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."
},
{
"label": "list_item",
"id": 22,
"page_no": 11,
"cluster": {
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 668.0,
"r": 545.1,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 676.9,
"r_x1": 545.1,
"r_y1": 676.9,
"r_x2": 545.1,
"r_y2": 668.0,
"r_x3": 320.8,
"r_y3": 668.0,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 688.9,
"r_x1": 510.6,
"r_y1": 688.9,
"r_x2": 510.6,
"r_y2": 680.0,
"r_x3": 308.9,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."
},
{
"label": "list_item",
"id": 25,
"page_no": 11,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 692.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 320.8,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"
},
{
"label": "page_footer",
"id": 14,
"page_no": 11,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "12"
}
],
"body": [
{
"label": "picture",
"id": 30,
"page_no": 11,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 53.5,
"t": 74.7,
"r": 544.9,
"b": 147.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.6,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": [
{
"id": 46,
"label": "text",
"bbox": {
"l": 119.4,
"t": 77.3,
"r": 151.9,
"b": 83.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 119.4,
"r_y0": 83.3,
"r_x1": 151.9,
"r_y1": 83.3,
"r_x2": 151.9,
"r_y2": 77.3,
"r_x3": 119.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "PubTabNet",
"orig": "PubTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 47,
"label": "text",
"bbox": {
"l": 53.3,
"t": 75.2,
"r": 59.3,
"b": 81.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 53.3,
"r_y0": 81.1,
"r_x1": 59.3,
"r_y1": 81.1,
"r_x2": 59.3,
"r_y2": 75.2,
"r_x3": 53.3,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "b.",
"orig": "b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 48,
"label": "text",
"bbox": {
"l": 289.6,
"t": 77.5,
"r": 319.8,
"b": 83.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.6,
"r_y0": 83.4,
"r_x1": 319.8,
"r_y1": 83.4,
"r_x2": 319.8,
"r_y2": 77.5,
"r_x3": 289.6,
"r_y3": 77.5,
"coord_origin": "TOPLEFT"
},
"text": "FinTabNet",
"orig": "FinTabNet",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 49,
"label": "text",
"bbox": {
"l": 448.4,
"t": 77.3,
"r": 481.8,
"b": 83.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 448.4,
"r_y0": 83.2,
"r_x1": 481.8,
"r_y1": 83.2,
"r_x2": 481.8,
"r_y2": 77.3,
"r_x3": 448.4,
"r_y3": 77.3,
"coord_origin": "TOPLEFT"
},
"text": "Table Bank",
"orig": "Table Bank",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 50,
"label": "text",
"bbox": {
"l": 82.6,
"t": 141.3,
"r": 95.0,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.6,
"r_y0": 146.2,
"r_x1": 95.0,
"r_y1": 146.2,
"r_x2": 95.0,
"r_y2": 141.3,
"r_x3": 82.6,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train",
"orig": "Train",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 51,
"label": "text",
"bbox": {
"l": 63.0,
"t": 101.1,
"r": 85.3,
"b": 106.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.0,
"r_y0": 106.1,
"r_x1": 85.3,
"r_y1": 106.1,
"r_x2": 85.3,
"r_y2": 101.1,
"r_x3": 63.0,
"r_y3": 101.1,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 52,
"label": "text",
"bbox": {
"l": 67.8,
"t": 124.4,
"r": 85.2,
"b": 129.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 67.8,
"r_y0": 129.4,
"r_x1": 85.2,
"r_y1": 129.4,
"r_x2": 85.2,
"r_y2": 124.4,
"r_x3": 67.8,
"r_y3": 124.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 53,
"label": "text",
"bbox": {
"l": 227.6,
"t": 102.5,
"r": 249.8,
"b": 107.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 227.6,
"r_y0": 107.5,
"r_x1": 249.8,
"r_y1": 107.5,
"r_x2": 249.8,
"r_y2": 102.5,
"r_x3": 227.6,
"r_y3": 102.5,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 54,
"label": "text",
"bbox": {
"l": 232.2,
"t": 127.0,
"r": 249.7,
"b": 131.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 232.2,
"r_y0": 131.9,
"r_x1": 249.7,
"r_y1": 131.9,
"r_x2": 249.7,
"r_y2": 127.0,
"r_x3": 232.2,
"r_y3": 127.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 55,
"label": "text",
"bbox": {
"l": 396.2,
"t": 114.0,
"r": 413.7,
"b": 119.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 396.2,
"r_y0": 119.0,
"r_x1": 413.7,
"r_y1": 119.0,
"r_x2": 413.7,
"r_y2": 114.0,
"r_x3": 396.2,
"r_y3": 114.0,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 56,
"label": "text",
"bbox": {
"l": 97.4,
"t": 141.3,
"r": 105.1,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.4,
"r_y0": 146.2,
"r_x1": 105.1,
"r_y1": 146.2,
"r_x2": 105.1,
"r_y2": 141.3,
"r_x3": 97.4,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Val",
"orig": "Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 57,
"label": "text",
"bbox": {
"l": 60.9,
"t": 85.7,
"r": 76.2,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 11,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 60.9,
"r_y0": 90.7,
"r_x1": 76.2,
"r_y1": 90.7,
"r_x2": 76.2,
"r_y2": 85.7,
"r_x3": 60.9,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 58,
"label": "text",
"bbox": {
"l": 82.3,
"t": 86.2,
"r": 107.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 12,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 82.3,
"r_y0": 91.2,
"r_x1": 107.0,
"r_y1": 91.2,
"r_x2": 107.0,
"r_y2": 86.2,
"r_x3": 82.3,
"r_y3": 86.2,
"coord_origin": "TOPLEFT"
},
"text": "500K 10K",
"orig": "500K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 59,
"label": "text",
"bbox": {
"l": 246.2,
"t": 141.6,
"r": 281.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 13,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 246.2,
"r_y0": 146.6,
"r_x1": 281.9,
"r_y1": 146.6,
"r_x2": 281.9,
"r_y2": 141.6,
"r_x3": 246.2,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 60,
"label": "text",
"bbox": {
"l": 226.7,
"t": 85.7,
"r": 241.9,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 14,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 226.7,
"r_y0": 90.7,
"r_x1": 241.9,
"r_y1": 90.7,
"r_x2": 241.9,
"r_y2": 85.7,
"r_x3": 226.7,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100%",
"orig": "100%",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 61,
"label": "text",
"bbox": {
"l": 249.9,
"t": 86.1,
"r": 282.5,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 15,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 249.9,
"r_y0": 91.0,
"r_x1": 282.5,
"r_y1": 91.0,
"r_x2": 282.5,
"r_y2": 86.1,
"r_x3": 249.9,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "91K 10K 10K",
"orig": "91K 10K 10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 62,
"label": "text",
"bbox": {
"l": 410.2,
"t": 141.3,
"r": 444.7,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 16,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 410.2,
"r_y0": 146.2,
"r_x1": 444.7,
"r_y1": 146.2,
"r_x2": 444.7,
"r_y2": 141.3,
"r_x3": 410.2,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Train Test Val",
"orig": "Train Test Val",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 63,
"label": "text",
"bbox": {
"l": 391.4,
"t": 85.7,
"r": 432.7,
"b": 90.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 17,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 391.4,
"r_y0": 90.7,
"r_x1": 432.7,
"r_y1": 90.7,
"r_x2": 432.7,
"r_y2": 85.7,
"r_x3": 391.4,
"r_y3": 85.7,
"coord_origin": "TOPLEFT"
},
"text": "100% 130K 5K",
"orig": "100% 130K 5K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 64,
"label": "text",
"bbox": {
"l": 435.6,
"t": 86.3,
"r": 445.6,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 18,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 435.6,
"r_y0": 91.2,
"r_x1": 445.6,
"r_y1": 91.2,
"r_x2": 445.6,
"r_y2": 86.3,
"r_x3": 435.6,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "10K",
"orig": "10K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 65,
"label": "text",
"bbox": {
"l": 113.9,
"t": 141.3,
"r": 136.2,
"b": 146.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 19,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.9,
"r_y0": 146.2,
"r_x1": 136.2,
"r_y1": 146.2,
"r_x2": 136.2,
"r_y2": 141.3,
"r_x3": 113.9,
"r_y3": 141.3,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 66,
"label": "text",
"bbox": {
"l": 116.9,
"t": 94.8,
"r": 127.1,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 20,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 116.9,
"r_y0": 99.8,
"r_x1": 127.1,
"r_y1": 99.8,
"r_x2": 127.1,
"r_y2": 94.8,
"r_x3": 116.9,
"r_y3": 94.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 67,
"label": "text",
"bbox": {
"l": 113.3,
"t": 100.9,
"r": 127.1,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 21,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.3,
"r_y0": 105.9,
"r_x1": 127.1,
"r_y1": 105.9,
"r_x2": 127.1,
"r_y2": 100.9,
"r_x3": 113.3,
"r_y3": 100.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 68,
"label": "text",
"bbox": {
"l": 112.9,
"t": 107.1,
"r": 127.1,
"b": 112.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 22,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 112.0,
"r_x1": 127.1,
"r_y1": 112.0,
"r_x2": 127.1,
"r_y2": 107.1,
"r_x3": 112.9,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 69,
"label": "text",
"bbox": {
"l": 113.2,
"t": 122.6,
"r": 127.0,
"b": 127.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 23,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 113.2,
"r_y0": 127.6,
"r_x1": 127.0,
"r_y1": 127.6,
"r_x2": 127.0,
"r_y2": 122.6,
"r_x3": 113.2,
"r_y3": 122.6,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 70,
"label": "text",
"bbox": {
"l": 112.9,
"t": 128.7,
"r": 127.0,
"b": 133.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 24,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.9,
"r_y0": 133.7,
"r_x1": 127.0,
"r_y1": 133.7,
"r_x2": 127.0,
"r_y2": 128.7,
"r_x3": 112.9,
"r_y3": 128.7,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 71,
"label": "text",
"bbox": {
"l": 138.6,
"t": 141.4,
"r": 156.0,
"b": 146.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 25,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 138.6,
"r_y0": 146.4,
"r_x1": 156.0,
"r_y1": 146.4,
"r_x2": 156.0,
"r_y2": 141.4,
"r_x3": 138.6,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 72,
"label": "text",
"bbox": {
"l": 122.0,
"t": 86.3,
"r": 151.0,
"b": 91.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 26,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 122.0,
"r_y0": 91.2,
"r_x1": 151.0,
"r_y1": 91.2,
"r_x2": 151.0,
"r_y2": 86.3,
"r_x3": 122.0,
"r_y3": 86.3,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 73,
"label": "text",
"bbox": {
"l": 311.7,
"t": 86.6,
"r": 321.7,
"b": 91.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 27,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.7,
"r_y0": 91.5,
"r_x1": 321.7,
"r_y1": 91.5,
"r_x2": 321.7,
"r_y2": 86.6,
"r_x3": 311.7,
"r_y3": 86.6,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 74,
"label": "text",
"bbox": {
"l": 287.9,
"t": 141.7,
"r": 310.1,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 28,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 287.9,
"r_y0": 146.7,
"r_x1": 310.1,
"r_y1": 146.7,
"r_x2": 310.1,
"r_y2": 141.7,
"r_x3": 287.9,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 75,
"label": "text",
"bbox": {
"l": 289.2,
"t": 93.1,
"r": 299.4,
"b": 98.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 29,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 289.2,
"r_y0": 98.0,
"r_x1": 299.4,
"r_y1": 98.0,
"r_x2": 299.4,
"r_y2": 93.1,
"r_x3": 289.2,
"r_y3": 93.1,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 76,
"label": "text",
"bbox": {
"l": 285.6,
"t": 99.2,
"r": 299.4,
"b": 104.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 30,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.6,
"r_y0": 104.2,
"r_x1": 299.4,
"r_y1": 104.2,
"r_x2": 299.4,
"r_y2": 99.2,
"r_x3": 285.6,
"r_y3": 99.2,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 77,
"label": "text",
"bbox": {
"l": 285.3,
"t": 105.3,
"r": 299.4,
"b": 110.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 31,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.3,
"r_y0": 110.3,
"r_x1": 299.4,
"r_y1": 110.3,
"r_x2": 299.4,
"r_y2": 105.3,
"r_x3": 285.3,
"r_y3": 105.3,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 78,
"label": "text",
"bbox": {
"l": 285.4,
"t": 120.4,
"r": 299.2,
"b": 125.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 32,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.4,
"r_y0": 125.3,
"r_x1": 299.2,
"r_y1": 125.3,
"r_x2": 299.2,
"r_y2": 120.4,
"r_x3": 285.4,
"r_y3": 120.4,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 79,
"label": "text",
"bbox": {
"l": 285.1,
"t": 126.5,
"r": 299.2,
"b": 131.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 33,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 285.1,
"r_y0": 131.5,
"r_x1": 299.2,
"r_y1": 131.5,
"r_x2": 299.2,
"r_y2": 126.5,
"r_x3": 285.1,
"r_y3": 126.5,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 80,
"label": "text",
"bbox": {
"l": 311.3,
"t": 141.7,
"r": 328.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 34,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 311.3,
"r_y0": 146.7,
"r_x1": 328.8,
"r_y1": 146.7,
"r_x2": 328.8,
"r_y2": 141.7,
"r_x3": 311.3,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 81,
"label": "text",
"bbox": {
"l": 299.6,
"t": 86.7,
"r": 309.6,
"b": 91.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 35,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 299.6,
"r_y0": 91.7,
"r_x1": 309.6,
"r_y1": 91.7,
"r_x2": 309.6,
"r_y2": 86.7,
"r_x3": 299.6,
"r_y3": 86.7,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 82,
"label": "text",
"bbox": {
"l": 466.0,
"t": 141.7,
"r": 483.5,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 36,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 146.6,
"r_x1": 483.5,
"r_y1": 146.6,
"r_x2": 483.5,
"r_y2": 141.7,
"r_x3": 466.0,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 83,
"label": "text",
"bbox": {
"l": 459.0,
"t": 93.8,
"r": 469.2,
"b": 98.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 37,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 459.0,
"r_y0": 98.7,
"r_x1": 469.2,
"r_y1": 98.7,
"r_x2": 469.2,
"r_y2": 93.8,
"r_x3": 459.0,
"r_y3": 93.8,
"coord_origin": "TOPLEFT"
},
"text": "Non",
"orig": "Non",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 84,
"label": "text",
"bbox": {
"l": 455.4,
"t": 99.9,
"r": 469.2,
"b": 104.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 38,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.4,
"r_y0": 104.8,
"r_x1": 469.2,
"r_y1": 104.8,
"r_x2": 469.2,
"r_y2": 99.9,
"r_x3": 455.4,
"r_y3": 99.9,
"coord_origin": "TOPLEFT"
},
"text": "Strict",
"orig": "Strict",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 85,
"label": "text",
"bbox": {
"l": 455.0,
"t": 106.0,
"r": 469.2,
"b": 111.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 39,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 455.0,
"r_y0": 111.0,
"r_x1": 469.2,
"r_y1": 111.0,
"r_x2": 469.2,
"r_y2": 106.0,
"r_x3": 455.0,
"r_y3": 106.0,
"coord_origin": "TOPLEFT"
},
"text": "HTML",
"orig": "HTML",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 86,
"label": "text",
"bbox": {
"l": 467.4,
"t": 85.6,
"r": 480.7,
"b": 90.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 40,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 467.4,
"r_y0": 90.5,
"r_x1": 480.7,
"r_y1": 90.5,
"r_x2": 480.7,
"r_y2": 85.6,
"r_x3": 467.4,
"r_y3": 85.6,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 87,
"label": "text",
"bbox": {
"l": 160.4,
"t": 141.6,
"r": 182.6,
"b": 146.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 41,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.4,
"r_y0": 146.5,
"r_x1": 182.6,
"r_y1": 146.5,
"r_x2": 182.6,
"r_y2": 141.6,
"r_x3": 160.4,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex",
"orig": "Complex",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 88,
"label": "text",
"bbox": {
"l": 153.7,
"t": 94.9,
"r": 173.3,
"b": 99.8,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 42,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 153.7,
"r_y0": 99.8,
"r_x1": 173.3,
"r_y1": 99.8,
"r_x2": 173.3,
"r_y2": 94.9,
"r_x3": 153.7,
"r_y3": 94.9,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 89,
"label": "text",
"bbox": {
"l": 154.5,
"t": 101.0,
"r": 173.3,
"b": 105.9,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 43,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 154.5,
"r_y0": 105.9,
"r_x1": 173.3,
"r_y1": 105.9,
"r_x2": 173.3,
"r_y2": 101.0,
"r_x3": 154.5,
"r_y3": 101.0,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 90,
"label": "text",
"bbox": {
"l": 155.3,
"t": 107.1,
"r": 173.3,
"b": 112.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 44,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 155.3,
"r_y0": 112.1,
"r_x1": 173.3,
"r_y1": 112.1,
"r_x2": 173.3,
"r_y2": 107.1,
"r_x3": 155.3,
"r_y3": 107.1,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 91,
"label": "text",
"bbox": {
"l": 326.4,
"t": 107.2,
"r": 346.0,
"b": 112.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 45,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 326.4,
"r_y0": 112.2,
"r_x1": 346.0,
"r_y1": 112.2,
"r_x2": 346.0,
"r_y2": 107.2,
"r_x3": 326.4,
"r_y3": 107.2,
"coord_origin": "TOPLEFT"
},
"text": "Contain",
"orig": "Contain",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 92,
"label": "text",
"bbox": {
"l": 327.2,
"t": 113.4,
"r": 346.0,
"b": 118.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 46,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.2,
"r_y0": 118.3,
"r_x1": 346.0,
"r_y1": 118.3,
"r_x2": 346.0,
"r_y2": 113.4,
"r_x3": 327.2,
"r_y3": 113.4,
"coord_origin": "TOPLEFT"
},
"text": "Missing",
"orig": "Missing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 93,
"label": "text",
"bbox": {
"l": 327.9,
"t": 119.5,
"r": 346.0,
"b": 124.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 47,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 327.9,
"r_y0": 124.4,
"r_x1": 346.0,
"r_y1": 124.4,
"r_x2": 346.0,
"r_y2": 119.5,
"r_x3": 327.9,
"r_y3": 119.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 94,
"label": "text",
"bbox": {
"l": 489.0,
"t": 104.2,
"r": 508.8,
"b": 109.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 48,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.0,
"r_y0": 109.1,
"r_x1": 508.8,
"r_y1": 109.1,
"r_x2": 508.8,
"r_y2": 104.2,
"r_x3": 489.0,
"r_y3": 104.2,
"coord_origin": "TOPLEFT"
},
"text": "Dataset",
"orig": "Dataset",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 95,
"label": "text",
"bbox": {
"l": 490.2,
"t": 110.3,
"r": 508.8,
"b": 115.2,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 49,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.2,
"r_y0": 115.2,
"r_x1": 508.8,
"r_y1": 115.2,
"r_x2": 508.8,
"r_y2": 110.3,
"r_x3": 490.2,
"r_y3": 110.3,
"coord_origin": "TOPLEFT"
},
"text": "doesn't",
"orig": "doesn't",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 96,
"label": "text",
"bbox": {
"l": 489.7,
"t": 116.4,
"r": 508.8,
"b": 121.4,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 50,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 489.7,
"r_y0": 121.4,
"r_x1": 508.8,
"r_y1": 121.4,
"r_x2": 508.8,
"r_y2": 116.4,
"r_x3": 489.7,
"r_y3": 116.4,
"coord_origin": "TOPLEFT"
},
"text": "provide",
"orig": "provide",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 97,
"label": "text",
"bbox": {
"l": 490.7,
"t": 122.5,
"r": 508.8,
"b": 127.5,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 51,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 490.7,
"r_y0": 127.5,
"r_x1": 508.8,
"r_y1": 127.5,
"r_x2": 508.8,
"r_y2": 122.5,
"r_x3": 490.7,
"r_y3": 122.5,
"coord_origin": "TOPLEFT"
},
"text": "bboxes",
"orig": "bboxes",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 98,
"label": "text",
"bbox": {
"l": 185.4,
"t": 141.7,
"r": 202.8,
"b": 146.7,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 52,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.4,
"r_y0": 146.7,
"r_x1": 202.8,
"r_y1": 146.7,
"r_x2": 202.8,
"r_y2": 141.7,
"r_x3": 185.4,
"r_y3": 141.7,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 99,
"label": "text",
"bbox": {
"l": 168.5,
"t": 86.1,
"r": 197.5,
"b": 91.1,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 53,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 168.5,
"r_y0": 91.1,
"r_x1": 197.5,
"r_y1": 91.1,
"r_x2": 197.5,
"r_y2": 86.1,
"r_x3": 168.5,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "230K 280K",
"orig": "230K 280K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 100,
"label": "text",
"bbox": {
"l": 357.4,
"t": 86.0,
"r": 367.4,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 54,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 357.4,
"r_y0": 91.0,
"r_x1": 367.4,
"r_y1": 91.0,
"r_x2": 367.4,
"r_y2": 86.0,
"r_x3": 357.4,
"r_y3": 86.0,
"coord_origin": "TOPLEFT"
},
"text": "65K",
"orig": "65K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 101,
"label": "text",
"bbox": {
"l": 333.7,
"t": 141.6,
"r": 374.9,
"b": 146.6,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 55,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 333.7,
"r_y0": 146.6,
"r_x1": 374.9,
"r_y1": 146.6,
"r_x2": 374.9,
"r_y2": 141.6,
"r_x3": 333.7,
"r_y3": 141.6,
"coord_origin": "TOPLEFT"
},
"text": "Complex Simple",
"orig": "Complex Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 102,
"label": "text",
"bbox": {
"l": 345.7,
"t": 86.1,
"r": 355.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 56,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.7,
"r_y0": 91.0,
"r_x1": 355.7,
"r_y1": 91.0,
"r_x2": 355.7,
"r_y2": 86.1,
"r_x3": 345.7,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "47K",
"orig": "47K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 103,
"label": "text",
"bbox": {
"l": 508.5,
"t": 141.4,
"r": 526.0,
"b": 146.3,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 57,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 508.5,
"r_y0": 146.3,
"r_x1": 526.0,
"r_y1": 146.3,
"r_x2": 526.0,
"r_y2": 141.4,
"r_x3": 508.5,
"r_y3": 141.4,
"coord_origin": "TOPLEFT"
},
"text": "Simple",
"orig": "Simple",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 104,
"label": "text",
"bbox": {
"l": 510.4,
"t": 86.1,
"r": 523.7,
"b": 91.0,
"coord_origin": "TOPLEFT"
},
"confidence": 1.0,
"cells": [
{
"index": 58,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 510.4,
"r_y0": 91.0,
"r_x1": 523.7,
"r_y1": 91.0,
"r_x2": 523.7,
"r_y2": 86.1,
"r_x3": 510.4,
"r_y3": 86.1,
"coord_origin": "TOPLEFT"
},
"text": "145K",
"orig": "145K",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
}
]
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "caption",
"id": 1,
"page_no": 11,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 165.5,
"r": 545.1,
"b": 186.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.97,
"cells": [
{
"index": 59,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 174.4,
"r_x1": 545.1,
"r_y1": 174.4,
"r_x2": 545.1,
"r_y2": 165.5,
"r_x3": 50.1,
"r_y3": 165.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"orig": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 60,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 186.4,
"r_x1": 513.5,
"r_y1": 186.4,
"r_x2": 513.5,
"r_y2": 177.5,
"r_x3": 50.1,
"r_y3": 177.5,
"coord_origin": "TOPLEFT"
},
"text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."
},
{
"label": "list_item",
"id": 4,
"page_no": 11,
"cluster": {
"id": 4,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 210.9,
"r": 286.4,
"b": 231.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 61,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 219.8,
"r_x1": 71.1,
"r_y1": 219.8,
"r_x2": 71.1,
"r_y2": 210.9,
"r_x3": 61.6,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 62,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.5,
"r_y0": 219.8,
"r_x1": 286.4,
"r_y1": 219.8,
"r_x2": 286.4,
"r_y2": 210.9,
"r_x3": 73.5,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "TableFormer output does not include the table cell con-",
"orig": "TableFormer output does not include the table cell con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 63,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 231.8,
"r_x1": 87.5,
"r_y1": 231.8,
"r_x2": 87.5,
"r_y2": 222.9,
"r_x3": 70.0,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "tent.",
"orig": "tent.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 TableFormer output does not include the table cell content."
},
{
"label": "list_item",
"id": 3,
"page_no": 11,
"cluster": {
"id": 3,
"label": "list_item",
"bbox": {
"l": 61.6,
"t": 244.1,
"r": 286.4,
"b": 264.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 64,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 61.6,
"r_y0": 253.0,
"r_x1": 71.3,
"r_y1": 253.0,
"r_x2": 71.3,
"r_y2": 244.1,
"r_x3": 61.6,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "\u2022",
"orig": "\u2022",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 65,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 73.8,
"r_y0": 253.0,
"r_x1": 286.4,
"r_y1": 253.0,
"r_x2": 286.4,
"r_y2": 244.1,
"r_x3": 73.8,
"r_y3": 244.1,
"coord_origin": "TOPLEFT"
},
"text": "There are occasional inaccuracies in the predictions of",
"orig": "There are occasional inaccuracies in the predictions of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 66,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 70.0,
"r_y0": 264.9,
"r_x1": 150.4,
"r_y1": 264.9,
"r_x2": 150.4,
"r_y2": 256.0,
"r_x3": 70.0,
"r_y3": 256.0,
"coord_origin": "TOPLEFT"
},
"text": "the bounding boxes.",
"orig": "the bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."
},
{
"label": "text",
"id": 0,
"page_no": 11,
"cluster": {
"id": 0,
"label": "text",
"bbox": {
"l": 50.1,
"t": 279.2,
"r": 286.4,
"b": 395.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.98,
"cells": [
{
"index": 67,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 288.1,
"r_x1": 286.4,
"r_y1": 288.1,
"r_x2": 286.4,
"r_y2": 279.2,
"r_x3": 62.1,
"r_y3": 279.2,
"coord_origin": "TOPLEFT"
},
"text": "However, it is possible to mitigate those limitations by",
"orig": "However, it is possible to mitigate those limitations by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 68,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 300.1,
"r_x1": 286.4,
"r_y1": 300.1,
"r_x2": 286.4,
"r_y2": 291.2,
"r_x3": 50.1,
"r_y3": 291.2,
"coord_origin": "TOPLEFT"
},
"text": "combining the TableFormer predictions with the informa-",
"orig": "combining the TableFormer predictions with the informa-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 69,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 312.0,
"r_x1": 286.4,
"r_y1": 312.0,
"r_x2": 286.4,
"r_y2": 303.1,
"r_x3": 50.1,
"r_y3": 303.1,
"coord_origin": "TOPLEFT"
},
"text": "tion already present inside a programmatic PDF document.",
"orig": "tion already present inside a programmatic PDF document.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 70,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 324.0,
"r_x1": 286.4,
"r_y1": 324.0,
"r_x2": 286.4,
"r_y2": 315.1,
"r_x3": 50.1,
"r_y3": 315.1,
"coord_origin": "TOPLEFT"
},
"text": "More specifically, PDF documents can be seen as a se-",
"orig": "More specifically, PDF documents can be seen as a se-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 71,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 335.9,
"r_x1": 286.4,
"r_y1": 335.9,
"r_x2": 286.4,
"r_y2": 327.0,
"r_x3": 50.1,
"r_y3": 327.0,
"coord_origin": "TOPLEFT"
},
"text": "quence of PDF cells where each cell is described by its con-",
"orig": "quence of PDF cells where each cell is described by its con-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 72,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 347.9,
"r_x1": 286.4,
"r_y1": 347.9,
"r_x2": 286.4,
"r_y2": 339.0,
"r_x3": 50.1,
"r_y3": 339.0,
"coord_origin": "TOPLEFT"
},
"text": "tent and bounding box. If we are able to associate the PDF",
"orig": "tent and bounding box. If we are able to associate the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 73,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 359.8,
"r_x1": 286.4,
"r_y1": 359.8,
"r_x2": 286.4,
"r_y2": 350.9,
"r_x3": 50.1,
"r_y3": 350.9,
"coord_origin": "TOPLEFT"
},
"text": "cells with the predicted table cells, we can directly link the",
"orig": "cells with the predicted table cells, we can directly link the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 74,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 371.8,
"r_x1": 286.4,
"r_y1": 371.8,
"r_x2": 286.4,
"r_y2": 362.9,
"r_x3": 50.1,
"r_y3": 362.9,
"coord_origin": "TOPLEFT"
},
"text": "PDF cell content to the table cell structure and use the PDF",
"orig": "PDF cell content to the table cell structure and use the PDF",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 75,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 383.8,
"r_x1": 286.4,
"r_y1": 383.8,
"r_x2": 286.4,
"r_y2": 374.8,
"r_x3": 50.1,
"r_y3": 374.8,
"coord_origin": "TOPLEFT"
},
"text": "bounding boxes to correct misalignments in the predicted",
"orig": "bounding boxes to correct misalignments in the predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 76,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 395.7,
"r_x1": 154.6,
"r_y1": 395.7,
"r_x2": 154.6,
"r_y2": 386.8,
"r_x3": 50.1,
"r_y3": 386.8,
"coord_origin": "TOPLEFT"
},
"text": "table cell bounding boxes.",
"orig": "table cell bounding boxes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."
},
{
"label": "text",
"id": 11,
"page_no": 11,
"cluster": {
"id": 11,
"label": "text",
"bbox": {
"l": 50.1,
"t": 399.1,
"r": 286.4,
"b": 419.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 77,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 408.0,
"r_x1": 286.4,
"r_y1": 408.0,
"r_x2": 286.4,
"r_y2": 399.1,
"r_x3": 62.1,
"r_y3": 399.1,
"coord_origin": "TOPLEFT"
},
"text": "Here is a step-by-step description of the prediction post-",
"orig": "Here is a step-by-step description of the prediction post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 78,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 419.9,
"r_x1": 95.5,
"r_y1": 419.9,
"r_x2": 95.5,
"r_y2": 411.0,
"r_x3": 50.1,
"r_y3": 411.0,
"coord_origin": "TOPLEFT"
},
"text": "processing:",
"orig": "processing:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Here is a step-by-step description of the prediction postprocessing:"
},
{
"label": "list_item",
"id": 20,
"page_no": 11,
"cluster": {
"id": 20,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 423.3,
"r": 286.4,
"b": 456.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.83,
"cells": [
{
"index": 79,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 432.2,
"r_x1": 69.4,
"r_y1": 432.2,
"r_x2": 69.4,
"r_y2": 423.3,
"r_x3": 62.1,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "1.",
"orig": "1.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 80,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 71.8,
"r_y0": 432.2,
"r_x1": 286.4,
"r_y1": 432.2,
"r_x2": 286.4,
"r_y2": 423.3,
"r_x3": 71.8,
"r_y3": 423.3,
"coord_origin": "TOPLEFT"
},
"text": "Get the minimal grid dimensions - number of rows and",
"orig": "Get the minimal grid dimensions - number of rows and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 81,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 444.2,
"r_x1": 286.4,
"r_y1": 444.2,
"r_x2": 286.4,
"r_y2": 435.3,
"r_x3": 50.1,
"r_y3": 435.3,
"coord_origin": "TOPLEFT"
},
"text": "columns for the predicted table structure. This represents",
"orig": "columns for the predicted table structure. This represents",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 82,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 456.1,
"r_x1": 274.5,
"r_y1": 456.1,
"r_x2": 274.5,
"r_y2": 447.2,
"r_x3": 50.1,
"r_y3": 447.2,
"coord_origin": "TOPLEFT"
},
"text": "the most granular grid for the underlying table structure.",
"orig": "the most granular grid for the underlying table structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."
},
{
"label": "list_item",
"id": 2,
"page_no": 11,
"cluster": {
"id": 2,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 459.5,
"r": 286.4,
"b": 504.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 83,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 468.4,
"r_x1": 69.5,
"r_y1": 468.4,
"r_x2": 69.5,
"r_y2": 459.5,
"r_x3": 62.1,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "2.",
"orig": "2.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 84,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 77.4,
"r_y0": 468.4,
"r_x1": 286.4,
"r_y1": 468.4,
"r_x2": 286.4,
"r_y2": 459.5,
"r_x3": 77.4,
"r_y3": 459.5,
"coord_origin": "TOPLEFT"
},
"text": "Generate pair-wise matches between the bounding",
"orig": "Generate pair-wise matches between the bounding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 85,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 480.3,
"r_x1": 286.4,
"r_y1": 480.3,
"r_x2": 286.4,
"r_y2": 471.4,
"r_x3": 50.1,
"r_y3": 471.4,
"coord_origin": "TOPLEFT"
},
"text": "boxes of the PDF cells and the predicted cells. The Intersec-",
"orig": "boxes of the PDF cells and the predicted cells. The Intersec-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 86,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 492.3,
"r_x1": 286.4,
"r_y1": 492.3,
"r_x2": 286.4,
"r_y2": 483.4,
"r_x3": 50.1,
"r_y3": 483.4,
"coord_origin": "TOPLEFT"
},
"text": "tion Over Union (IOU) metric is used to evaluate the quality",
"orig": "tion Over Union (IOU) metric is used to evaluate the quality",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 87,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 504.2,
"r_x1": 110.7,
"r_y1": 504.2,
"r_x2": 110.7,
"r_y2": 495.3,
"r_x3": 50.1,
"r_y3": 495.3,
"coord_origin": "TOPLEFT"
},
"text": "of the matches.",
"orig": "of the matches.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."
},
{
"label": "list_item",
"id": 10,
"page_no": 11,
"cluster": {
"id": 10,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 507.6,
"r": 286.4,
"b": 528.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 88,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 516.5,
"r_x1": 69.9,
"r_y1": 516.5,
"r_x2": 69.9,
"r_y2": 507.6,
"r_x3": 62.1,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "3.",
"orig": "3.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 89,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 72.5,
"r_y0": 516.5,
"r_x1": 286.4,
"r_y1": 516.5,
"r_x2": 286.4,
"r_y2": 507.6,
"r_x3": 72.5,
"r_y3": 507.6,
"coord_origin": "TOPLEFT"
},
"text": "Use a carefully selected IOU threshold to designate",
"orig": "Use a carefully selected IOU threshold to designate",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 90,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 528.5,
"r_x1": 226.1,
"r_y1": 528.5,
"r_x2": 226.1,
"r_y2": 519.6,
"r_x3": 50.1,
"r_y3": 519.6,
"coord_origin": "TOPLEFT"
},
"text": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"orig": "the matches as \u201cgood\u201d ones and \u201cbad\u201d ones.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3. Use a carefully selected IOU threshold to designate the matches as \"good\" ones and \"bad\" ones."
},
{
"label": "list_item",
"id": 8,
"page_no": 11,
"cluster": {
"id": 8,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 531.8,
"r": 286.4,
"b": 564.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 91,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 540.7,
"r_x1": 286.4,
"r_y1": 540.7,
"r_x2": 286.4,
"r_y2": 531.8,
"r_x3": 62.1,
"r_y3": 531.8,
"coord_origin": "TOPLEFT"
},
"text": "3.a. If all IOU scores in a column are below the thresh-",
"orig": "3.a. If all IOU scores in a column are below the thresh-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 92,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 552.7,
"r_x1": 286.4,
"r_y1": 552.7,
"r_x2": 286.4,
"r_y2": 543.8,
"r_x3": 50.1,
"r_y3": 543.8,
"coord_origin": "TOPLEFT"
},
"text": "old, discard all predictions (structure and bounding boxes)",
"orig": "old, discard all predictions (structure and bounding boxes)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 93,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 564.7,
"r_x1": 114.0,
"r_y1": 564.7,
"r_x2": 114.0,
"r_y2": 555.7,
"r_x3": 50.1,
"r_y3": 555.7,
"coord_origin": "TOPLEFT"
},
"text": "for that column.",
"orig": "for that column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."
},
{
"label": "list_item",
"id": 5,
"page_no": 11,
"cluster": {
"id": 5,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 568.0,
"r": 286.4,
"b": 600.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 94,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 576.9,
"r_x1": 69.5,
"r_y1": 576.9,
"r_x2": 69.5,
"r_y2": 568.0,
"r_x3": 62.1,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "4.",
"orig": "4.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 95,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.7,
"r_y0": 576.9,
"r_x1": 286.4,
"r_y1": 576.9,
"r_x2": 286.4,
"r_y2": 568.0,
"r_x3": 76.7,
"r_y3": 568.0,
"coord_origin": "TOPLEFT"
},
"text": "Find the best-fitting content alignment for the pre-",
"orig": "Find the best-fitting content alignment for the pre-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 96,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 588.9,
"r_x1": 286.4,
"r_y1": 588.9,
"r_x2": 286.4,
"r_y2": 580.0,
"r_x3": 50.1,
"r_y3": 580.0,
"coord_origin": "TOPLEFT"
},
"text": "dicted cells with good IOU per each column. The alignment",
"orig": "dicted cells with good IOU per each column. The alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 97,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 600.8,
"r_x1": 278.7,
"r_y1": 600.8,
"r_x2": 278.7,
"r_y2": 591.9,
"r_x3": 50.1,
"r_y3": 591.9,
"coord_origin": "TOPLEFT"
},
"text": "of the column can be identified by the following formula:",
"orig": "of the column can be identified by the following formula:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"
},
{
"label": "formula",
"id": 12,
"page_no": 11,
"cluster": {
"id": 12,
"label": "formula",
"bbox": {
"l": 110.7,
"t": 623.4,
"r": 286.4,
"b": 654.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 98,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 112.0,
"r_y0": 632.8,
"r_x1": 158.0,
"r_y1": 632.8,
"r_x2": 158.0,
"r_y2": 624.0,
"r_x3": 112.0,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "alignment",
"orig": "alignment",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 99,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 160.7,
"r_y0": 632.8,
"r_x1": 203.5,
"r_y1": 632.8,
"r_x2": 203.5,
"r_y2": 624.0,
"r_x3": 160.7,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "= arg min",
"orig": "= arg min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 100,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 185.6,
"r_y0": 640.2,
"r_x1": 189.1,
"r_y1": 640.2,
"r_x2": 189.1,
"r_y2": 634.0,
"r_x3": 185.6,
"r_y3": 634.0,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 101,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 203.5,
"r_y0": 632.8,
"r_x1": 208.5,
"r_y1": 632.8,
"r_x2": 208.5,
"r_y2": 623.4,
"r_x3": 203.5,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 102,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 208.5,
"r_y0": 632.8,
"r_x1": 220.3,
"r_y1": 632.8,
"r_x2": 220.3,
"r_y2": 624.0,
"r_x3": 208.5,
"r_y3": 624.0,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 103,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 632.8,
"r_x1": 225.8,
"r_y1": 632.8,
"r_x2": 225.8,
"r_y2": 623.4,
"r_x3": 220.8,
"r_y3": 623.4,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 104,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 110.7,
"r_y0": 654.1,
"r_x1": 122.5,
"r_y1": 654.1,
"r_x2": 122.5,
"r_y2": 645.3,
"r_x3": 110.7,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "D$_{c}$",
"orig": "D$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 105,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 125.8,
"r_y0": 654.1,
"r_x1": 133.5,
"r_y1": 654.1,
"r_x2": 133.5,
"r_y2": 645.3,
"r_x3": 125.8,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "=",
"orig": "=",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 106,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 136.3,
"r_y0": 654.1,
"r_x1": 156.0,
"r_y1": 654.1,
"r_x2": 156.0,
"r_y2": 645.3,
"r_x3": 136.3,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "max",
"orig": "max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 107,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 156.0,
"r_y0": 654.1,
"r_x1": 161.0,
"r_y1": 654.1,
"r_x2": 161.0,
"r_y2": 644.7,
"r_x3": 156.0,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 108,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 161.0,
"r_y0": 654.1,
"r_x1": 170.2,
"r_y1": 654.1,
"r_x2": 170.2,
"r_y2": 645.3,
"r_x3": 161.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 109,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 170.7,
"r_y0": 654.1,
"r_x1": 185.7,
"r_y1": 654.1,
"r_x2": 185.7,
"r_y2": 644.7,
"r_x3": 170.7,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "} \u2212",
"orig": "} \u2212",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 110,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 187.9,
"r_y0": 654.1,
"r_x1": 206.1,
"r_y1": 654.1,
"r_x2": 206.1,
"r_y2": 645.3,
"r_x3": 187.9,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "min",
"orig": "min",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 111,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 206.1,
"r_y0": 654.1,
"r_x1": 211.0,
"r_y1": 654.1,
"r_x2": 211.0,
"r_y2": 644.7,
"r_x3": 206.1,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 112,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 211.0,
"r_y0": 654.1,
"r_x1": 220.3,
"r_y1": 654.1,
"r_x2": 220.3,
"r_y2": 645.3,
"r_x3": 211.0,
"r_y3": 645.3,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 113,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 220.8,
"r_y0": 654.1,
"r_x1": 225.8,
"r_y1": 654.1,
"r_x2": 225.8,
"r_y2": 644.7,
"r_x3": 220.8,
"r_y3": 644.7,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 114,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 274.7,
"r_y0": 643.8,
"r_x1": 286.4,
"r_y1": 643.8,
"r_x2": 286.4,
"r_y2": 634.9,
"r_x3": 274.7,
"r_y3": 634.9,
"coord_origin": "TOPLEFT"
},
"text": "(4)",
"orig": "(4)",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "$$\\text{alignment} = \\arg\\min_{c} \\{ D_{c} \\}, \\qquad D_{c} = \\max \\{ x_{c} \\} - \\min \\{ x_{c} \\} \\qquad (4)$$"
},
{
"label": "text",
"id": 7,
"page_no": 11,
"cluster": {
"id": 7,
"label": "text",
"bbox": {
"l": 50.1,
"t": 667.3,
"r": 286.4,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 115,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 677.0,
"r_x1": 74.5,
"r_y1": 677.0,
"r_x2": 74.5,
"r_y2": 668.1,
"r_x3": 50.1,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "where",
"orig": "where",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 116,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 78.3,
"r_y0": 676.8,
"r_x1": 82.6,
"r_y1": 676.8,
"r_x2": 82.6,
"r_y2": 667.9,
"r_x3": 78.3,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "c",
"orig": "c",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 117,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 86.5,
"r_y0": 677.0,
"r_x1": 123.6,
"r_y1": 677.0,
"r_x2": 123.6,
"r_y2": 668.1,
"r_x3": 86.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is one of",
"orig": "is one of",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 118,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 127.5,
"r_y0": 676.8,
"r_x1": 132.5,
"r_y1": 676.8,
"r_x2": 132.5,
"r_y2": 667.3,
"r_x3": 127.5,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "{",
"orig": "{",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 119,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 132.5,
"r_y0": 677.0,
"r_x1": 210.7,
"r_y1": 677.0,
"r_x2": 210.7,
"r_y2": 668.1,
"r_x3": 132.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "left, centroid, right",
"orig": "left, centroid, right",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 120,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 210.7,
"r_y0": 676.8,
"r_x1": 215.7,
"r_y1": 676.8,
"r_x2": 215.7,
"r_y2": 667.3,
"r_x3": 210.7,
"r_y3": 667.3,
"coord_origin": "TOPLEFT"
},
"text": "}",
"orig": "}",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 121,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 219.6,
"r_y0": 677.0,
"r_x1": 233.9,
"r_y1": 677.0,
"r_x2": 233.9,
"r_y2": 668.1,
"r_x3": 219.6,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "and",
"orig": "and",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 122,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 237.8,
"r_y0": 676.8,
"r_x1": 247.1,
"r_y1": 676.8,
"r_x2": 247.1,
"r_y2": 667.9,
"r_x3": 237.8,
"r_y3": 667.9,
"coord_origin": "TOPLEFT"
},
"text": "x$_{c}$",
"orig": "x$_{c}$",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 123,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 251.5,
"r_y0": 677.0,
"r_x1": 286.4,
"r_y1": 677.0,
"r_x2": 286.4,
"r_y2": 668.1,
"r_x3": 251.5,
"r_y3": 668.1,
"coord_origin": "TOPLEFT"
},
"text": "is the x-",
"orig": "is the x-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 124,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 688.9,
"r_x1": 205.9,
"r_y1": 688.9,
"r_x2": 205.9,
"r_y2": 680.0,
"r_x3": 50.1,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "coordinate for the corresponding point.",
"orig": "coordinate for the corresponding point.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "where c is one of { left, centroid, right } and x$_{c}$ is the x-coordinate for the corresponding point."
},
{
"label": "list_item",
"id": 13,
"page_no": 11,
"cluster": {
"id": 13,
"label": "list_item",
"bbox": {
"l": 50.1,
"t": 692.3,
"r": 286.4,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 125,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 701.2,
"r_x1": 69.5,
"r_y1": 701.2,
"r_x2": 69.5,
"r_y2": 692.3,
"r_x3": 62.1,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "5.",
"orig": "5.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 126,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 76.3,
"r_y0": 701.2,
"r_x1": 286.4,
"r_y1": 701.2,
"r_x2": 286.4,
"r_y2": 692.3,
"r_x3": 76.3,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "Use the alignment computed in step 4, to compute",
"orig": "Use the alignment computed in step 4, to compute",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 127,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 713.2,
"r_x1": 94.6,
"r_y1": 713.2,
"r_x2": 94.6,
"r_y2": 704.2,
"r_x3": 50.1,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "the median",
"orig": "the median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 128,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 97.6,
"r_y0": 712.9,
"r_x1": 103.3,
"r_y1": 712.9,
"r_x2": 103.3,
"r_y2": 704.1,
"r_x3": 97.6,
"r_y3": 704.1,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 129,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.3,
"r_y0": 713.2,
"r_x1": 286.4,
"r_y1": 713.2,
"r_x2": 286.4,
"r_y2": 704.2,
"r_x3": 103.3,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "-coordinate for all table columns and the me-",
"orig": "-coordinate for all table columns and the me-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "5. Use the alignment computed in step 4, to compute the median x-coordinate for all table columns and the me-"
},
{
"label": "text",
"id": 16,
"page_no": 11,
"cluster": {
"id": 16,
"label": "text",
"bbox": {
"l": 308.9,
"t": 210.9,
"r": 545.1,
"b": 255.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 130,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 219.8,
"r_x1": 545.1,
"r_y1": 219.8,
"r_x2": 545.1,
"r_y2": 210.9,
"r_x3": 308.9,
"r_y3": 210.9,
"coord_origin": "TOPLEFT"
},
"text": "dian cell size for all table cells. The usage of median dur-",
"orig": "dian cell size for all table cells. The usage of median dur-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 131,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 231.8,
"r_x1": 545.1,
"r_y1": 231.8,
"r_x2": 545.1,
"r_y2": 222.9,
"r_x3": 308.9,
"r_y3": 222.9,
"coord_origin": "TOPLEFT"
},
"text": "ing the computations, helps to eliminate outliers caused by",
"orig": "ing the computations, helps to eliminate outliers caused by",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 132,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 243.7,
"r_x1": 545.1,
"r_y1": 243.7,
"r_x2": 545.1,
"r_y2": 234.8,
"r_x3": 308.9,
"r_y3": 234.8,
"coord_origin": "TOPLEFT"
},
"text": "occasional column spans which are usually wider than the",
"orig": "occasional column spans which are usually wider than the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 133,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 255.7,
"r_x1": 339.6,
"r_y1": 255.7,
"r_x2": 339.6,
"r_y2": 246.8,
"r_x3": 308.9,
"r_y3": 246.8,
"coord_origin": "TOPLEFT"
},
"text": "normal.",
"orig": "normal.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."
},
{
"label": "list_item",
"id": 9,
"page_no": 11,
"cluster": {
"id": 9,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 259.1,
"r": 545.1,
"b": 280.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.94,
"cells": [
{
"index": 134,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 268.0,
"r_x1": 328.3,
"r_y1": 268.0,
"r_x2": 328.3,
"r_y2": 259.1,
"r_x3": 320.8,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "6.",
"orig": "6.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 135,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 334.9,
"r_y0": 268.0,
"r_x1": 545.1,
"r_y1": 268.0,
"r_x2": 545.1,
"r_y2": 259.1,
"r_x3": 334.9,
"r_y3": 259.1,
"coord_origin": "TOPLEFT"
},
"text": "Snap all cells with bad IOU to their corresponding",
"orig": "Snap all cells with bad IOU to their corresponding",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 136,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 280.0,
"r_x1": 338.2,
"r_y1": 280.0,
"r_x2": 338.2,
"r_y2": 271.1,
"r_x3": 308.9,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "median",
"orig": "median",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 137,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 340.7,
"r_y0": 279.7,
"r_x1": 346.4,
"r_y1": 279.7,
"r_x2": 346.4,
"r_y2": 270.9,
"r_x3": 340.7,
"r_y3": 270.9,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 138,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 346.4,
"r_y0": 280.0,
"r_x1": 453.7,
"r_y1": 280.0,
"r_x2": 453.7,
"r_y2": 271.1,
"r_x3": 346.4,
"r_y3": 271.1,
"coord_origin": "TOPLEFT"
},
"text": "-coordinates and cell sizes.",
"orig": "-coordinates and cell sizes.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "6. Snap all cells with bad IOU to their corresponding median x-coordinates and cell sizes."
},
{
"label": "list_item",
"id": 6,
"page_no": 11,
"cluster": {
"id": 6,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 283.4,
"r": 545.1,
"b": 387.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 139,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 292.3,
"r_x1": 328.4,
"r_y1": 292.3,
"r_x2": 328.4,
"r_y2": 283.4,
"r_x3": 320.8,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "7.",
"orig": "7.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 140,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 330.9,
"r_y0": 292.3,
"r_x1": 545.1,
"r_y1": 292.3,
"r_x2": 545.1,
"r_y2": 283.4,
"r_x3": 330.9,
"r_y3": 283.4,
"coord_origin": "TOPLEFT"
},
"text": "Generate a new set of pair-wise matches between the",
"orig": "Generate a new set of pair-wise matches between the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 141,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 304.2,
"r_x1": 545.1,
"r_y1": 304.2,
"r_x2": 545.1,
"r_y2": 295.3,
"r_x3": 308.9,
"r_y3": 295.3,
"coord_origin": "TOPLEFT"
},
"text": "corrected bounding boxes and PDF cells. This time use a",
"orig": "corrected bounding boxes and PDF cells. This time use a",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 142,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 316.2,
"r_x1": 545.1,
"r_y1": 316.2,
"r_x2": 545.1,
"r_y2": 307.3,
"r_x3": 308.9,
"r_y3": 307.3,
"coord_origin": "TOPLEFT"
},
"text": "modified version of the IOU metric, where the area of the",
"orig": "modified version of the IOU metric, where the area of the",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 143,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 328.1,
"r_x1": 545.1,
"r_y1": 328.1,
"r_x2": 545.1,
"r_y2": 319.2,
"r_x3": 308.9,
"r_y3": 319.2,
"coord_origin": "TOPLEFT"
},
"text": "intersection between the predicted and PDF cells is divided",
"orig": "intersection between the predicted and PDF cells is divided",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 144,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 340.1,
"r_x1": 397.2,
"r_y1": 340.1,
"r_x2": 397.2,
"r_y2": 331.2,
"r_x3": 308.9,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "by the PDF cell area.",
"orig": "by the PDF cell area.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 145,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 403.7,
"r_y0": 340.1,
"r_x1": 545.1,
"r_y1": 340.1,
"r_x2": 545.1,
"r_y2": 331.2,
"r_x3": 403.7,
"r_y3": 331.2,
"coord_origin": "TOPLEFT"
},
"text": "In case there are multiple matches",
"orig": "In case there are multiple matches",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 146,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 352.0,
"r_x1": 545.1,
"r_y1": 352.0,
"r_x2": 545.1,
"r_y2": 343.1,
"r_x3": 308.9,
"r_y3": 343.1,
"coord_origin": "TOPLEFT"
},
"text": "for the same PDF cell, the prediction with the higher score",
"orig": "for the same PDF cell, the prediction with the higher score",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 147,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 364.0,
"r_x1": 545.1,
"r_y1": 364.0,
"r_x2": 545.1,
"r_y2": 355.1,
"r_x3": 308.9,
"r_y3": 355.1,
"coord_origin": "TOPLEFT"
},
"text": "is preferred. This covers the cases where the PDF cells are",
"orig": "is preferred. This covers the cases where the PDF cells are",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 148,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 376.0,
"r_x1": 545.1,
"r_y1": 376.0,
"r_x2": 545.1,
"r_y2": 367.0,
"r_x3": 308.9,
"r_y3": 367.0,
"coord_origin": "TOPLEFT"
},
"text": "smaller than the area of predicted or corrected prediction",
"orig": "smaller than the area of predicted or corrected prediction",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 149,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 387.9,
"r_x1": 329.6,
"r_y1": 387.9,
"r_x2": 329.6,
"r_y2": 379.0,
"r_x3": 308.9,
"r_y3": 379.0,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."
},
{
"label": "list_item",
"id": 17,
"page_no": 11,
"cluster": {
"id": 17,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 391.3,
"r": 545.1,
"b": 460.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [
{
"index": 150,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 400.2,
"r_x1": 328.6,
"r_y1": 400.2,
"r_x2": 328.6,
"r_y2": 391.3,
"r_x3": 320.8,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "8.",
"orig": "8.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 151,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.1,
"r_y0": 400.2,
"r_x1": 545.1,
"r_y1": 400.2,
"r_x2": 545.1,
"r_y2": 391.3,
"r_x3": 331.1,
"r_y3": 391.3,
"coord_origin": "TOPLEFT"
},
"text": "In some rare occasions, we have noticed that Table-",
"orig": "In some rare occasions, we have noticed that Table-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 152,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 412.2,
"r_x1": 545.1,
"r_y1": 412.2,
"r_x2": 545.1,
"r_y2": 403.3,
"r_x3": 308.9,
"r_y3": 403.3,
"coord_origin": "TOPLEFT"
},
"text": "Former can confuse a single column as two. When the post-",
"orig": "Former can confuse a single column as two. When the post-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 153,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 424.1,
"r_x1": 545.1,
"r_y1": 424.1,
"r_x2": 545.1,
"r_y2": 415.2,
"r_x3": 308.9,
"r_y3": 415.2,
"coord_origin": "TOPLEFT"
},
"text": "processing steps are applied, this results with two predicted",
"orig": "processing steps are applied, this results with two predicted",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 154,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 436.1,
"r_x1": 545.1,
"r_y1": 436.1,
"r_x2": 545.1,
"r_y2": 427.2,
"r_x3": 308.9,
"r_y3": 427.2,
"coord_origin": "TOPLEFT"
},
"text": "columns pointing to the same PDF column. In such case",
"orig": "columns pointing to the same PDF column. In such case",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 155,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 448.0,
"r_x1": 545.1,
"r_y1": 448.0,
"r_x2": 545.1,
"r_y2": 439.1,
"r_x3": 308.9,
"r_y3": 439.1,
"coord_origin": "TOPLEFT"
},
"text": "we must de-duplicate the columns according to highest to-",
"orig": "we must de-duplicate the columns according to highest to-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 156,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 460.0,
"r_x1": 426.2,
"r_y1": 460.0,
"r_x2": 426.2,
"r_y2": 451.1,
"r_x3": 308.9,
"r_y3": 451.1,
"coord_origin": "TOPLEFT"
},
"text": "tal column intersection score.",
"orig": "tal column intersection score.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the post-processing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."
},
{
"label": "list_item",
"id": 15,
"page_no": 11,
"cluster": {
"id": 15,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 463.4,
"r": 545.1,
"b": 567.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 157,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 472.3,
"r_x1": 328.7,
"r_y1": 472.3,
"r_x2": 328.7,
"r_y2": 463.4,
"r_x3": 320.8,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "9.",
"orig": "9.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 158,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 331.3,
"r_y0": 472.3,
"r_x1": 545.1,
"r_y1": 472.3,
"r_x2": 545.1,
"r_y2": 463.4,
"r_x3": 331.3,
"r_y3": 463.4,
"coord_origin": "TOPLEFT"
},
"text": "Pick up the remaining orphan cells. There could be",
"orig": "Pick up the remaining orphan cells. There could be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 159,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 484.3,
"r_x1": 545.1,
"r_y1": 484.3,
"r_x2": 545.1,
"r_y2": 475.3,
"r_x3": 308.9,
"r_y3": 475.3,
"coord_origin": "TOPLEFT"
},
"text": "cases, when after applying all the previous post-processing",
"orig": "cases, when after applying all the previous post-processing",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 160,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 496.2,
"r_x1": 545.1,
"r_y1": 496.2,
"r_x2": 545.1,
"r_y2": 487.3,
"r_x3": 308.9,
"r_y3": 487.3,
"coord_origin": "TOPLEFT"
},
"text": "steps, some PDF cells could still remain without any match",
"orig": "steps, some PDF cells could still remain without any match",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 161,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 508.2,
"r_x1": 381.9,
"r_y1": 508.2,
"r_x2": 381.9,
"r_y2": 499.3,
"r_x3": 308.9,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "to predicted cells.",
"orig": "to predicted cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 162,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 388.7,
"r_y0": 508.2,
"r_x1": 545.1,
"r_y1": 508.2,
"r_x2": 545.1,
"r_y2": 499.3,
"r_x3": 388.7,
"r_y3": 499.3,
"coord_origin": "TOPLEFT"
},
"text": "However, it is still possible to deduce",
"orig": "However, it is still possible to deduce",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 163,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 520.1,
"r_x1": 545.1,
"r_y1": 520.1,
"r_x2": 545.1,
"r_y2": 511.2,
"r_x3": 308.9,
"r_y3": 511.2,
"coord_origin": "TOPLEFT"
},
"text": "the correct matching for an orphan PDF cell by mapping its",
"orig": "the correct matching for an orphan PDF cell by mapping its",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 164,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 532.1,
"r_x1": 545.1,
"r_y1": 532.1,
"r_x2": 545.1,
"r_y2": 523.2,
"r_x3": 308.9,
"r_y3": 523.2,
"coord_origin": "TOPLEFT"
},
"text": "bounding box on the geometry of the grid. This mapping",
"orig": "bounding box on the geometry of the grid. This mapping",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 165,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 544.0,
"r_x1": 545.1,
"r_y1": 544.0,
"r_x2": 545.1,
"r_y2": 535.1,
"r_x3": 308.9,
"r_y3": 535.1,
"coord_origin": "TOPLEFT"
},
"text": "decides if the content of the orphan cell will be appended to",
"orig": "decides if the content of the orphan cell will be appended to",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 166,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 556.0,
"r_x1": 545.1,
"r_y1": 556.0,
"r_x2": 545.1,
"r_y2": 547.1,
"r_x3": 308.9,
"r_y3": 547.1,
"coord_origin": "TOPLEFT"
},
"text": "an already matched table cell, or a new table cell should be",
"orig": "an already matched table cell, or a new table cell should be",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 167,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 567.9,
"r_x1": 442.2,
"r_y1": 567.9,
"r_x2": 442.2,
"r_y2": 559.0,
"r_x3": 308.9,
"r_y3": 559.0,
"coord_origin": "TOPLEFT"
},
"text": "created to match with the orphan.",
"orig": "created to match with the orphan.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."
},
{
"label": "text",
"id": 19,
"page_no": 11,
"cluster": {
"id": 19,
"label": "text",
"bbox": {
"l": 308.9,
"t": 571.3,
"r": 545.1,
"b": 604.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [
{
"index": 168,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 580.2,
"r_x1": 545.1,
"r_y1": 580.2,
"r_x2": 545.1,
"r_y2": 571.3,
"r_x3": 320.8,
"r_y3": 571.3,
"coord_origin": "TOPLEFT"
},
"text": "9a. Compute the top and bottom boundary of the hori-",
"orig": "9a. Compute the top and bottom boundary of the hori-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 169,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 592.2,
"r_x1": 471.6,
"r_y1": 592.2,
"r_x2": 471.6,
"r_y2": 583.3,
"r_x3": 308.9,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "zontal band for each grid row (min/max",
"orig": "zontal band for each grid row (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 170,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 474.8,
"r_y0": 592.0,
"r_x1": 479.7,
"r_y1": 592.0,
"r_x2": 479.7,
"r_y2": 583.1,
"r_x3": 474.8,
"r_y3": 583.1,
"coord_origin": "TOPLEFT"
},
"text": "y",
"orig": "y",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 171,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 483.3,
"r_y0": 592.2,
"r_x1": 545.1,
"r_y1": 592.2,
"r_x2": 545.1,
"r_y2": 583.3,
"r_x3": 483.3,
"r_y3": 583.3,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per",
"orig": "coordinates per",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 172,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 604.2,
"r_x1": 329.9,
"r_y1": 604.2,
"r_x2": 329.9,
"r_y2": 595.2,
"r_x3": 308.9,
"r_y3": 595.2,
"coord_origin": "TOPLEFT"
},
"text": "row).",
"orig": "row).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."
},
{
"label": "list_item",
"id": 21,
"page_no": 11,
"cluster": {
"id": 21,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 607.6,
"r": 545.1,
"b": 628.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [
{
"index": 173,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 616.5,
"r_x1": 332.9,
"r_y1": 616.5,
"r_x2": 332.9,
"r_y2": 607.6,
"r_x3": 320.8,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "9b.",
"orig": "9b.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 174,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 339.9,
"r_y0": 616.5,
"r_x1": 545.1,
"r_y1": 616.5,
"r_x2": 545.1,
"r_y2": 607.6,
"r_x3": 339.9,
"r_y3": 607.6,
"coord_origin": "TOPLEFT"
},
"text": "Intersect the orphan\u2019s bounding box with the row",
"orig": "Intersect the orphan\u2019s bounding box with the row",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 175,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 628.4,
"r_x1": 495.3,
"r_y1": 628.4,
"r_x2": 495.3,
"r_y2": 619.5,
"r_x3": 308.9,
"r_y3": 619.5,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid row.",
"orig": "bands, and map the cell to the closest grid row.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."
},
{
"label": "list_item",
"id": 18,
"page_no": 11,
"cluster": {
"id": 18,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 631.8,
"r": 545.1,
"b": 664.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [
{
"index": 176,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 640.7,
"r_x1": 545.1,
"r_y1": 640.7,
"r_x2": 545.1,
"r_y2": 631.8,
"r_x3": 320.8,
"r_y3": 631.8,
"coord_origin": "TOPLEFT"
},
"text": "9c. Compute the left and right boundary of the vertical",
"orig": "9c. Compute the left and right boundary of the vertical",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 177,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 652.7,
"r_x1": 455.3,
"r_y1": 652.7,
"r_x2": 455.3,
"r_y2": 643.8,
"r_x3": 308.9,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "band for each grid column (min/max",
"orig": "band for each grid column (min/max",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 178,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 457.8,
"r_y0": 652.5,
"r_x1": 463.5,
"r_y1": 652.5,
"r_x2": 463.5,
"r_y2": 643.6,
"r_x3": 457.8,
"r_y3": 643.6,
"coord_origin": "TOPLEFT"
},
"text": "x",
"orig": "x",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 179,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 466.0,
"r_y0": 652.7,
"r_x1": 545.1,
"r_y1": 652.7,
"r_x2": 545.1,
"r_y2": 643.8,
"r_x3": 466.0,
"r_y3": 643.8,
"coord_origin": "TOPLEFT"
},
"text": "coordinates per col-",
"orig": "coordinates per col-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 180,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 664.6,
"r_x1": 332.4,
"r_y1": 664.6,
"r_x2": 332.4,
"r_y2": 655.7,
"r_x3": 308.9,
"r_y3": 655.7,
"coord_origin": "TOPLEFT"
},
"text": "umn).",
"orig": "umn).",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."
},
{
"label": "list_item",
"id": 22,
"page_no": 11,
"cluster": {
"id": 22,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 668.0,
"r": 545.1,
"b": 688.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.76,
"cells": [
{
"index": 181,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 676.9,
"r_x1": 545.1,
"r_y1": 676.9,
"r_x2": 545.1,
"r_y2": 668.0,
"r_x3": 320.8,
"r_y3": 668.0,
"coord_origin": "TOPLEFT"
},
"text": "9d. Intersect the orphan\u2019s bounding box with the column",
"orig": "9d. Intersect the orphan\u2019s bounding box with the column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 182,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 688.9,
"r_x1": 510.6,
"r_y1": 688.9,
"r_x2": 510.6,
"r_y2": 680.0,
"r_x3": 308.9,
"r_y3": 680.0,
"coord_origin": "TOPLEFT"
},
"text": "bands, and map the cell to the closest grid column.",
"orig": "bands, and map the cell to the closest grid column.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."
},
{
"label": "list_item",
"id": 25,
"page_no": 11,
"cluster": {
"id": 25,
"label": "list_item",
"bbox": {
"l": 308.9,
"t": 692.3,
"r": 545.1,
"b": 713.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [
{
"index": 183,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 320.8,
"r_y0": 701.2,
"r_x1": 545.1,
"r_y1": 701.2,
"r_x2": 545.1,
"r_y2": 692.3,
"r_x3": 320.8,
"r_y3": 692.3,
"coord_origin": "TOPLEFT"
},
"text": "9e. If the table cell under the identified row and column",
"orig": "9e. If the table cell under the identified row and column",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 184,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 713.2,
"r_x1": 545.1,
"r_y1": 713.2,
"r_x2": 545.1,
"r_y2": 704.2,
"r_x3": 308.9,
"r_y3": 704.2,
"coord_origin": "TOPLEFT"
},
"text": "is not empty, extend its content with the content of the or-",
"orig": "is not empty, extend its content with the content of the or-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"
}
],
"headers": [
{
"label": "page_footer",
"id": 14,
"page_no": 11,
"cluster": {
"id": 14,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 185,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "12",
"orig": "12",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "12"
}
]
}
},
{
"page_no": 12,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 88.8,
"r_y1": 84.1,
"r_x2": 88.8,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 127.0,
"r_y1": 108.0,
"r_x2": 127.0,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 119.8,
"r_x1": 286.4,
"r_y1": 119.8,
"r_x2": 286.4,
"r_y2": 111.2,
"r_x3": 62.1,
"r_y3": 111.2,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.7,
"r_x1": 234.1,
"r_y1": 131.7,
"r_x2": 234.1,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.3,
"r_y0": 511.0,
"r_x1": 273.1,
"r_y1": 511.0,
"r_x2": 273.1,
"r_y2": 502.1,
"r_x3": 63.3,
"r_y3": 502.1,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 315.5,
"r_x1": 345.6,
"r_y1": 315.5,
"r_x2": 345.6,
"r_y2": 306.6,
"r_x3": 308.9,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.8,
"r_y0": 315.5,
"r_x1": 545.1,
"r_y1": 315.5,
"r_x2": 545.1,
"r_y2": 306.6,
"r_x3": 352.8,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 327.5,
"r_x1": 355.9,
"r_y1": 327.5,
"r_x2": 355.9,
"r_y2": 318.6,
"r_x3": 308.9,
"r_y3": 318.6,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.3,
"r_y0": 689.4,
"r_x1": 541.6,
"r_y1": 689.4,
"r_x2": 541.6,
"r_y2": 680.5,
"r_x3": 312.3,
"r_y3": 680.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 88.8,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 88.8,
"r_y1": 84.1,
"r_x2": 88.8,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 127.0,
"r_y1": 108.0,
"r_x2": 127.0,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 111.2,
"r": 286.4,
"b": 131.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 119.8,
"r_x1": 286.4,
"r_y1": 119.8,
"r_x2": 286.4,
"r_y2": 111.2,
"r_x3": 62.1,
"r_y3": 111.2,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.7,
"r_x1": 234.1,
"r_y1": 131.7,
"r_x2": 234.1,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 8,
"label": "caption",
"bbox": {
"l": 63.3,
"t": 502.1,
"r": 273.1,
"b": 511.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.3,
"r_y0": 511.0,
"r_x1": 273.1,
"r_y1": 511.0,
"r_x2": 273.1,
"r_y2": 502.1,
"r_x3": 63.3,
"r_y3": 502.1,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 306.6,
"r": 545.1,
"b": 327.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 315.5,
"r_x1": 345.6,
"r_y1": 315.5,
"r_x2": 345.6,
"r_y2": 306.6,
"r_x3": 308.9,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.8,
"r_y0": 315.5,
"r_x1": 545.1,
"r_y1": 315.5,
"r_x2": 545.1,
"r_y2": 306.6,
"r_x3": 352.8,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 327.5,
"r_x1": 355.9,
"r_y1": 327.5,
"r_x2": 355.9,
"r_y2": 318.6,
"r_x3": 308.9,
"r_y3": 318.6,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "caption",
"bbox": {
"l": 312.3,
"t": 680.5,
"r": 541.6,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.3,
"r_y0": 689.4,
"r_x1": 541.6,
"r_y1": 689.4,
"r_x2": 541.6,
"r_y2": 680.5,
"r_x3": 312.3,
"r_y3": 680.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 17,
"label": "table",
"bbox": {
"l": 310.3,
"t": 101.2,
"r": 555.8,
"b": 136.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
{
"id": 32,
"label": "table",
"bbox": {
"l": 310.0,
"t": 154.6,
"r": 555.7,
"b": 184.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 84.0,
"t": 156.3,
"r": 239.2,
"b": 214.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
{
"id": 21,
"label": "table",
"bbox": {
"l": 310.0,
"t": 195.7,
"r": 555.7,
"b": 233.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 82.9,
"t": 233.8,
"r": 239.2,
"b": 291.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [],
"children": []
},
{
"id": 19,
"label": "picture",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
{
"id": 37,
"label": "table",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.53,
"cells": [],
"children": []
},
{
"id": 6,
"label": "table",
"bbox": {
"l": 83.9,
"t": 309.0,
"r": 239.2,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
{
"id": 12,
"label": "table",
"bbox": {
"l": 335.3,
"t": 388.5,
"r": 490.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
{
"id": 0,
"label": "table",
"bbox": {
"l": 83.3,
"t": 396.0,
"r": 248.9,
"b": 487.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 334.9,
"t": 453.9,
"r": 490.1,
"b": 502.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [],
"children": []
},
{
"id": 5,
"label": "table",
"bbox": {
"l": 335.3,
"t": 519.1,
"r": 490.2,
"b": 567.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
{
"id": 13,
"label": "picture",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [],
"children": []
},
{
"id": 30,
"label": "table",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.59,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"17": {
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.3,
"t": 101.2,
"r": 555.8,
"b": 136.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"32": {
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 310.0,
"t": 154.6,
"r": 555.7,
"b": 184.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.0,
"t": 156.3,
"r": 239.2,
"b": 214.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"21": {
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 310.0,
"t": 195.7,
"r": 555.7,
"b": 233.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"4": {
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.9,
"t": 233.8,
"r": 239.2,
"b": 291.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"37": {
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.53,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"6": {
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.9,
"t": 309.0,
"r": 239.2,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"12": {
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.3,
"t": 388.5,
"r": 490.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"0": {
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.3,
"t": 396.0,
"r": 248.9,
"b": 487.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.9,
"t": 453.9,
"r": 490.1,
"b": 502.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"5": {
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.3,
"t": 519.1,
"r": 490.2,
"b": 567.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"30": {
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.59,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "text",
"id": 14,
"page_no": 12,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 88.8,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 88.8,
"r_y1": 84.1,
"r_x2": 88.8,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "phan cell."
},
{
"label": "text",
"id": 3,
"page_no": 12,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 127.0,
"r_y1": 108.0,
"r_x2": 127.0,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."
},
{
"label": "text",
"id": 1,
"page_no": 12,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 111.2,
"r": 286.4,
"b": 131.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 119.8,
"r_x1": 286.4,
"r_y1": 119.8,
"r_x2": 286.4,
"r_y2": 111.2,
"r_x3": 62.1,
"r_y3": 111.2,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.7,
"r_x1": 234.1,
"r_y1": 131.7,
"r_x2": 234.1,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."
},
{
"label": "caption",
"id": 8,
"page_no": 12,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 63.3,
"t": 502.1,
"r": 273.1,
"b": 511.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.3,
"r_y0": 511.0,
"r_x1": 273.1,
"r_y1": 511.0,
"r_x2": 273.1,
"r_y2": 502.1,
"r_x3": 63.3,
"r_y3": 502.1,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 8: Example of a table with multi-line header."
},
{
"label": "caption",
"id": 11,
"page_no": 12,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 306.6,
"r": 545.1,
"b": 327.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 315.5,
"r_x1": 345.6,
"r_y1": 315.5,
"r_x2": 345.6,
"r_y2": 306.6,
"r_x3": 308.9,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.8,
"r_y0": 315.5,
"r_x1": 545.1,
"r_y1": 315.5,
"r_x2": 545.1,
"r_y2": 306.6,
"r_x3": 352.8,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 327.5,
"r_x1": 355.9,
"r_y1": 327.5,
"r_x2": 355.9,
"r_y2": 318.6,
"r_x3": 308.9,
"r_y3": 318.6,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 9: Example of a table with big empty distance between cells."
},
{
"label": "caption",
"id": 2,
"page_no": 12,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 312.3,
"t": 680.5,
"r": 541.6,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.3,
"r_y0": 689.4,
"r_x1": 541.6,
"r_y1": 689.4,
"r_x2": 541.6,
"r_y2": 680.5,
"r_x3": 312.3,
"r_y3": 680.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 10: Example of a complex table with empty cells."
},
{
"label": "page_footer",
"id": 7,
"page_no": 12,
"cluster": {
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "13"
},
{
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.3,
"t": 101.2,
"r": 555.8,
"b": 136.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 310.0,
"t": 154.6,
"r": 555.7,
"b": 184.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.0,
"t": 156.3,
"r": 239.2,
"b": 214.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 310.0,
"t": 195.7,
"r": 555.7,
"b": 233.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.9,
"t": 233.8,
"r": 239.2,
"b": 291.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 19,
"page_no": 12,
"cluster": {
"id": 19,
"label": "picture",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.53,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.9,
"t": 309.0,
"r": 239.2,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.3,
"t": 388.5,
"r": 490.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.3,
"t": 396.0,
"r": 248.9,
"b": 487.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.9,
"t": 453.9,
"r": 490.1,
"b": 502.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.3,
"t": 519.1,
"r": 490.2,
"b": 567.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 13,
"page_no": 12,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.59,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"body": [
{
"label": "text",
"id": 14,
"page_no": 12,
"cluster": {
"id": 14,
"label": "text",
"bbox": {
"l": 50.1,
"t": 75.2,
"r": 88.8,
"b": 84.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.75,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 84.1,
"r_x1": 88.8,
"r_y1": 84.1,
"r_x2": 88.8,
"r_y2": 75.2,
"r_x3": 50.1,
"r_y3": 75.2,
"coord_origin": "TOPLEFT"
},
"text": "phan cell.",
"orig": "phan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "phan cell."
},
{
"label": "text",
"id": 3,
"page_no": 12,
"cluster": {
"id": 3,
"label": "text",
"bbox": {
"l": 50.1,
"t": 87.2,
"r": 286.4,
"b": 108.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 96.1,
"r_x1": 286.4,
"r_y1": 96.1,
"r_x2": 286.4,
"r_y2": 87.2,
"r_x3": 62.1,
"r_y3": 87.2,
"coord_origin": "TOPLEFT"
},
"text": "9f. Otherwise create a new structural cell and match it",
"orig": "9f. Otherwise create a new structural cell and match it",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 108.0,
"r_x1": 127.0,
"r_y1": 108.0,
"r_x2": 127.0,
"r_y2": 99.1,
"r_x3": 50.1,
"r_y3": 99.1,
"coord_origin": "TOPLEFT"
},
"text": "wit the orphan cell.",
"orig": "wit the orphan cell.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."
},
{
"label": "text",
"id": 1,
"page_no": 12,
"cluster": {
"id": 1,
"label": "text",
"bbox": {
"l": 50.1,
"t": 111.2,
"r": 286.4,
"b": 131.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 62.1,
"r_y0": 119.8,
"r_x1": 286.4,
"r_y1": 119.8,
"r_x2": 286.4,
"r_y2": 111.2,
"r_x3": 62.1,
"r_y3": 111.2,
"coord_origin": "TOPLEFT"
},
"text": "Aditional images with examples of TableFormer predic-",
"orig": "Aditional images with examples of TableFormer predic-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 131.7,
"r_x1": 234.1,
"r_y1": 131.7,
"r_x2": 234.1,
"r_y2": 123.1,
"r_x3": 50.1,
"r_y3": 123.1,
"coord_origin": "TOPLEFT"
},
"text": "tions and post-processing can be found below.",
"orig": "tions and post-processing can be found below.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."
},
{
"label": "caption",
"id": 8,
"page_no": 12,
"cluster": {
"id": 8,
"label": "caption",
"bbox": {
"l": 63.3,
"t": 502.1,
"r": 273.1,
"b": 511.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 63.3,
"r_y0": 511.0,
"r_x1": 273.1,
"r_y1": 511.0,
"r_x2": 273.1,
"r_y2": 502.1,
"r_x3": 63.3,
"r_y3": 502.1,
"coord_origin": "TOPLEFT"
},
"text": "Figure 8: Example of a table with multi-line header.",
"orig": "Figure 8: Example of a table with multi-line header.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 8: Example of a table with multi-line header."
},
{
"label": "caption",
"id": 11,
"page_no": 12,
"cluster": {
"id": 11,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 306.6,
"r": 545.1,
"b": 327.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 315.5,
"r_x1": 345.6,
"r_y1": 315.5,
"r_x2": 345.6,
"r_y2": 306.6,
"r_x3": 308.9,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Figure 9:",
"orig": "Figure 9:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 7,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 352.8,
"r_y0": 315.5,
"r_x1": 545.1,
"r_y1": 315.5,
"r_x2": 545.1,
"r_y2": 306.6,
"r_x3": 352.8,
"r_y3": 306.6,
"coord_origin": "TOPLEFT"
},
"text": "Example of a table with big empty distance be-",
"orig": "Example of a table with big empty distance be-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 8,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 327.5,
"r_x1": 355.9,
"r_y1": 327.5,
"r_x2": 355.9,
"r_y2": 318.6,
"r_x3": 308.9,
"r_y3": 318.6,
"coord_origin": "TOPLEFT"
},
"text": "tween cells.",
"orig": "tween cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 9: Example of a table with big empty distance between cells."
},
{
"label": "caption",
"id": 2,
"page_no": 12,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 312.3,
"t": 680.5,
"r": 541.6,
"b": 689.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 9,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 312.3,
"r_y0": 689.4,
"r_x1": 541.6,
"r_y1": 689.4,
"r_x2": 541.6,
"r_y2": 680.5,
"r_x3": 312.3,
"r_y3": 680.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 10: Example of a complex table with empty cells.",
"orig": "Figure 10: Example of a complex table with empty cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 10: Example of a complex table with empty cells."
},
{
"label": "table",
"id": 17,
"page_no": 12,
"cluster": {
"id": 17,
"label": "table",
"bbox": {
"l": 310.3,
"t": 101.2,
"r": 555.8,
"b": 136.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 32,
"page_no": 12,
"cluster": {
"id": 32,
"label": "table",
"bbox": {
"l": 310.0,
"t": 154.6,
"r": 555.7,
"b": 184.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 12,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 84.0,
"t": 156.3,
"r": 239.2,
"b": 214.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 21,
"page_no": 12,
"cluster": {
"id": 21,
"label": "table",
"bbox": {
"l": 310.0,
"t": 195.7,
"r": 555.7,
"b": 233.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.66,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 12,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 82.9,
"t": 233.8,
"r": 239.2,
"b": 291.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 19,
"page_no": 12,
"cluster": {
"id": 19,
"label": "picture",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.7,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 37,
"page_no": 12,
"cluster": {
"id": 37,
"label": "table",
"bbox": {
"l": 309.8,
"t": 253.9,
"r": 426.0,
"b": 292.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.53,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"lcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 12,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 83.9,
"t": 309.0,
"r": 239.2,
"b": 367.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 12,
"page_no": 12,
"cluster": {
"id": 12,
"label": "table",
"bbox": {
"l": 335.3,
"t": 388.5,
"r": 490.1,
"b": 437.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 0,
"page_no": 12,
"cluster": {
"id": 0,
"label": "table",
"bbox": {
"l": 83.3,
"t": 396.0,
"r": 248.9,
"b": 487.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 12,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 334.9,
"t": 453.9,
"r": 490.1,
"b": 502.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.88,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"lcel",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 5,
"page_no": 12,
"cluster": {
"id": 5,
"label": "table",
"bbox": {
"l": 335.3,
"t": 519.1,
"r": 490.2,
"b": 567.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"lcel",
"lcel",
"lcel",
"lcel",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 13,
"page_no": 12,
"cluster": {
"id": 13,
"label": "picture",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.8,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 30,
"page_no": 12,
"cluster": {
"id": 30,
"label": "table",
"bbox": {
"l": 334.0,
"t": 593.1,
"r": 518.5,
"b": 665.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.59,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"headers": [
{
"label": "page_footer",
"id": 7,
"page_no": 12,
"cluster": {
"id": 7,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 10,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "13",
"orig": "13",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "13"
}
]
}
},
{
"page_no": 13,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.7,
"r_x1": 93.1,
"r_y1": 365.7,
"r_x2": 93.1,
"r_y2": 356.8,
"r_x3": 50.1,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.7,
"r_y0": 365.7,
"r_x1": 286.4,
"r_y1": 365.7,
"r_x2": 286.4,
"r_y2": 356.8,
"r_x3": 103.7,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 377.6,
"r_x1": 70.9,
"r_y1": 377.6,
"r_x2": 70.9,
"r_y2": 368.7,
"r_x3": 50.1,
"r_y3": 368.7,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 680.7,
"r_x1": 281.9,
"r_y1": 680.7,
"r_x2": 281.9,
"r_y2": 671.8,
"r_x3": 54.6,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.8,
"r_y0": 380.6,
"r_x1": 538.2,
"r_y1": 380.6,
"r_x2": 538.2,
"r_y2": 371.7,
"r_x3": 315.8,
"r_y3": 371.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.0,
"r_y0": 692.5,
"r_x1": 509.0,
"r_y1": 692.5,
"r_x2": 509.0,
"r_y2": 683.5,
"r_x3": 345.0,
"r_y3": 683.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 356.8,
"r": 286.4,
"b": 377.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.7,
"r_x1": 93.1,
"r_y1": 365.7,
"r_x2": 93.1,
"r_y2": 356.8,
"r_x3": 50.1,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.7,
"r_y0": 365.7,
"r_x1": 286.4,
"r_y1": 365.7,
"r_x2": 286.4,
"r_y2": 356.8,
"r_x3": 103.7,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 377.6,
"r_x1": 70.9,
"r_y1": 377.6,
"r_x2": 70.9,
"r_y2": 368.7,
"r_x3": 50.1,
"r_y3": 368.7,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 54.6,
"t": 671.8,
"r": 281.9,
"b": 680.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 680.7,
"r_x1": 281.9,
"r_y1": 680.7,
"r_x2": 281.9,
"r_y2": 671.8,
"r_x3": 54.6,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "caption",
"bbox": {
"l": 315.8,
"t": 371.7,
"r": 538.2,
"b": 380.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.8,
"r_y0": 380.6,
"r_x1": 538.2,
"r_y1": 380.6,
"r_x2": 538.2,
"r_y2": 371.7,
"r_x3": 315.8,
"r_y3": 371.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "caption",
"bbox": {
"l": 345.0,
"t": 683.5,
"r": 509.0,
"b": 692.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.0,
"r_y0": 692.5,
"r_x1": 509.0,
"r_y1": 692.5,
"r_x2": 509.0,
"r_y2": 683.5,
"r_x3": 345.0,
"r_y3": 683.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 41,
"label": "picture",
"bbox": {
"l": 318.6,
"t": 90.9,
"r": 534.7,
"b": 359.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
{
"id": 30,
"label": "picture",
"bbox": {
"l": 51.2,
"t": 104.3,
"r": 282.9,
"b": 344.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
{
"id": 23,
"label": "table",
"bbox": {
"l": 319.0,
"t": 161.2,
"r": 534.6,
"b": 214.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.62,
"cells": [],
"children": []
},
{
"id": 33,
"label": "table",
"bbox": {
"l": 319.0,
"t": 226.1,
"r": 534.4,
"b": 279.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
{
"id": 27,
"label": "table",
"bbox": {
"l": 51.7,
"t": 273.6,
"r": 283.1,
"b": 344.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
{
"id": 38,
"label": "table",
"bbox": {
"l": 328.1,
"t": 288.7,
"r": 523.9,
"b": 358.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.52,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 319.5,
"t": 430.9,
"r": 518.6,
"b": 477.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 51.4,
"t": 453.5,
"r": 310.7,
"b": 491.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 320.0,
"t": 489.2,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 50.9,
"t": 504.1,
"r": 310.6,
"b": 542.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
{
"id": 15,
"label": "table",
"bbox": {
"l": 319.8,
"t": 546.4,
"r": 519.6,
"b": 593.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
{
"id": 6,
"label": "table",
"bbox": {
"l": 51.3,
"t": 553.7,
"r": 311.1,
"b": 591.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
{
"id": 7,
"label": "table",
"bbox": {
"l": 319.1,
"t": 609.8,
"r": 533.8,
"b": 669.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [],
"children": []
},
{
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.1,
"b": 656.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"23": {
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 319.0,
"t": 161.2,
"r": 534.6,
"b": 214.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.62,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"33": {
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.0,
"t": 226.1,
"r": 534.4,
"b": 279.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"27": {
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.7,
"t": 273.6,
"r": 283.1,
"b": 344.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"38": {
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.1,
"t": 288.7,
"r": 523.9,
"b": 358.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.52,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.5,
"t": 430.9,
"r": 518.6,
"b": 477.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.4,
"t": 453.5,
"r": 310.7,
"b": 491.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"8": {
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 320.0,
"t": 489.2,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"4": {
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.9,
"t": 504.1,
"r": 310.6,
"b": 542.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"15": {
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.8,
"t": 546.4,
"r": 519.6,
"b": 593.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"6": {
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.3,
"t": 553.7,
"r": 311.1,
"b": 591.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"7": {
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.1,
"t": 609.8,
"r": 533.8,
"b": 669.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 13,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 356.8,
"r": 286.4,
"b": 377.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.7,
"r_x1": 93.1,
"r_y1": 365.7,
"r_x2": 93.1,
"r_y2": 356.8,
"r_x3": 50.1,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.7,
"r_y0": 365.7,
"r_x1": 286.4,
"r_y1": 365.7,
"r_x2": 286.4,
"r_y2": 356.8,
"r_x3": 103.7,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 377.6,
"r_x1": 70.9,
"r_y1": 377.6,
"r_x2": 70.9,
"r_y2": 368.7,
"r_x3": 50.1,
"r_y3": 368.7,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 11: Simple table with different style and empty cells."
},
{
"label": "caption",
"id": 1,
"page_no": 13,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 54.6,
"t": 671.8,
"r": 281.9,
"b": 680.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 680.7,
"r_x1": 281.9,
"r_y1": 680.7,
"r_x2": 281.9,
"r_y2": 671.8,
"r_x3": 54.6,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 12: Simple table predictions and post processing."
},
{
"label": "caption",
"id": 3,
"page_no": 13,
"cluster": {
"id": 3,
"label": "caption",
"bbox": {
"l": 315.8,
"t": 371.7,
"r": 538.2,
"b": 380.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.8,
"r_y0": 380.6,
"r_x1": 538.2,
"r_y1": 380.6,
"r_x2": 538.2,
"r_y2": 371.7,
"r_x3": 315.8,
"r_y3": 371.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 13: Table predictions example on colorful table."
},
{
"label": "caption",
"id": 2,
"page_no": 13,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 345.0,
"t": 683.5,
"r": 509.0,
"b": 692.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.0,
"r_y0": 692.5,
"r_x1": 509.0,
"r_y1": 692.5,
"r_x2": 509.0,
"r_y2": 683.5,
"r_x3": 345.0,
"r_y3": 683.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 14: Example with multi-line text."
},
{
"label": "page_footer",
"id": 5,
"page_no": 13,
"cluster": {
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "14"
},
{
"label": "picture",
"id": 41,
"page_no": 13,
"cluster": {
"id": 41,
"label": "picture",
"bbox": {
"l": 318.6,
"t": 90.9,
"r": 534.7,
"b": 359.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 30,
"page_no": 13,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 51.2,
"t": 104.3,
"r": 282.9,
"b": 344.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 319.0,
"t": 161.2,
"r": 534.6,
"b": 214.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.62,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.0,
"t": 226.1,
"r": 534.4,
"b": 279.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.7,
"t": 273.6,
"r": 283.1,
"b": 344.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.1,
"t": 288.7,
"r": 523.9,
"b": 358.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.52,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.5,
"t": 430.9,
"r": 518.6,
"b": 477.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.4,
"t": 453.5,
"r": 310.7,
"b": 491.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 320.0,
"t": 489.2,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.9,
"t": 504.1,
"r": 310.6,
"b": 542.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.8,
"t": 546.4,
"r": 519.6,
"b": 593.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.3,
"t": 553.7,
"r": 311.1,
"b": 591.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.1,
"t": 609.8,
"r": 533.8,
"b": 669.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 11,
"page_no": 13,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.1,
"b": 656.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 13,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 356.8,
"r": 286.4,
"b": 377.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.95,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 365.7,
"r_x1": 93.1,
"r_y1": 365.7,
"r_x2": 93.1,
"r_y2": 356.8,
"r_x3": 50.1,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 11:",
"orig": "Figure 11:",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 103.7,
"r_y0": 365.7,
"r_x1": 286.4,
"r_y1": 365.7,
"r_x2": 286.4,
"r_y2": 356.8,
"r_x3": 103.7,
"r_y3": 356.8,
"coord_origin": "TOPLEFT"
},
"text": "Simple table with different style and empty",
"orig": "Simple table with different style and empty",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 377.6,
"r_x1": 70.9,
"r_y1": 377.6,
"r_x2": 70.9,
"r_y2": 368.7,
"r_x3": 50.1,
"r_y3": 368.7,
"coord_origin": "TOPLEFT"
},
"text": "cells.",
"orig": "cells.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 11: Simple table with different style and empty cells."
},
{
"label": "caption",
"id": 1,
"page_no": 13,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 54.6,
"t": 671.8,
"r": 281.9,
"b": 680.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 54.6,
"r_y0": 680.7,
"r_x1": 281.9,
"r_y1": 680.7,
"r_x2": 281.9,
"r_y2": 671.8,
"r_x3": 54.6,
"r_y3": 671.8,
"coord_origin": "TOPLEFT"
},
"text": "Figure 12: Simple table predictions and post processing.",
"orig": "Figure 12: Simple table predictions and post processing.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 12: Simple table predictions and post processing."
},
{
"label": "caption",
"id": 3,
"page_no": 13,
"cluster": {
"id": 3,
"label": "caption",
"bbox": {
"l": 315.8,
"t": 371.7,
"r": 538.2,
"b": 380.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 4,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 315.8,
"r_y0": 380.6,
"r_x1": 538.2,
"r_y1": 380.6,
"r_x2": 538.2,
"r_y2": 371.7,
"r_x3": 315.8,
"r_y3": 371.7,
"coord_origin": "TOPLEFT"
},
"text": "Figure 13: Table predictions example on colorful table.",
"orig": "Figure 13: Table predictions example on colorful table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 13: Table predictions example on colorful table."
},
{
"label": "caption",
"id": 2,
"page_no": 13,
"cluster": {
"id": 2,
"label": "caption",
"bbox": {
"l": 345.0,
"t": 683.5,
"r": 509.0,
"b": 692.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.92,
"cells": [
{
"index": 5,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 345.0,
"r_y0": 692.5,
"r_x1": 509.0,
"r_y1": 692.5,
"r_x2": 509.0,
"r_y2": 683.5,
"r_x3": 345.0,
"r_y3": 683.5,
"coord_origin": "TOPLEFT"
},
"text": "Figure 14: Example with multi-line text.",
"orig": "Figure 14: Example with multi-line text.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 14: Example with multi-line text."
},
{
"label": "picture",
"id": 41,
"page_no": 13,
"cluster": {
"id": 41,
"label": "picture",
"bbox": {
"l": 318.6,
"t": 90.9,
"r": 534.7,
"b": 359.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.5,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 30,
"page_no": 13,
"cluster": {
"id": 30,
"label": "picture",
"bbox": {
"l": 51.2,
"t": 104.3,
"r": 282.9,
"b": 344.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 23,
"page_no": 13,
"cluster": {
"id": 23,
"label": "table",
"bbox": {
"l": 319.0,
"t": 161.2,
"r": 534.6,
"b": 214.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.62,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 33,
"page_no": 13,
"cluster": {
"id": 33,
"label": "table",
"bbox": {
"l": 319.0,
"t": 226.1,
"r": 534.4,
"b": 279.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 27,
"page_no": 13,
"cluster": {
"id": 27,
"label": "table",
"bbox": {
"l": 51.7,
"t": 273.6,
"r": 283.1,
"b": 344.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"ecel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 38,
"page_no": 13,
"cluster": {
"id": 38,
"label": "table",
"bbox": {
"l": 328.1,
"t": 288.7,
"r": 523.9,
"b": 358.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.52,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 10,
"page_no": 13,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 319.5,
"t": 430.9,
"r": 518.6,
"b": 477.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 9,
"page_no": 13,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 51.4,
"t": 453.5,
"r": 310.7,
"b": 491.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 8,
"page_no": 13,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 320.0,
"t": 489.2,
"r": 519.1,
"b": 535.7,
"coord_origin": "TOPLEFT"
},
"confidence": 0.85,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 4,
"page_no": 13,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 50.9,
"t": 504.1,
"r": 310.6,
"b": 542.4,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 15,
"page_no": 13,
"cluster": {
"id": 15,
"label": "table",
"bbox": {
"l": 319.8,
"t": 546.4,
"r": 519.6,
"b": 593.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 6,
"page_no": 13,
"cluster": {
"id": 6,
"label": "table",
"bbox": {
"l": 51.3,
"t": 553.7,
"r": 311.1,
"b": 591.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 7,
"page_no": 13,
"cluster": {
"id": 7,
"label": "table",
"bbox": {
"l": 319.1,
"t": 609.8,
"r": 533.8,
"b": 669.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.87,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 11,
"page_no": 13,
"cluster": {
"id": 11,
"label": "picture",
"bbox": {
"l": 50.4,
"t": 611.0,
"r": 177.1,
"b": 656.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.79,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 5,
"page_no": 13,
"cluster": {
"id": 5,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.89,
"cells": [
{
"index": 6,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "14",
"orig": "14",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "14"
}
]
}
},
{
"page_no": 14,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.2,
"r_y0": 653.3,
"r_x1": 252.2,
"r_y1": 653.3,
"r_x2": 252.2,
"r_y2": 644.4,
"r_x3": 84.2,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 661.8,
"r_x1": 545.1,
"r_y1": 661.8,
"r_x2": 545.1,
"r_y2": 652.9,
"r_x3": 308.9,
"r_y3": 652.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.9,
"r_x3": 308.9,
"r_y3": 664.9,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 84.2,
"t": 644.4,
"r": 252.2,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.2,
"r_y0": 653.3,
"r_x1": 252.2,
"r_y1": 653.3,
"r_x2": 252.2,
"r_y2": 644.4,
"r_x3": 84.2,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 652.9,
"r": 545.1,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 661.8,
"r_x1": 545.1,
"r_y1": 661.8,
"r_x2": 545.1,
"r_y2": 652.9,
"r_x3": 308.9,
"r_y3": 652.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.9,
"r_x3": 308.9,
"r_y3": 664.9,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 4,
"label": "table",
"bbox": {
"l": 323.0,
"t": 121.5,
"r": 526.0,
"b": 222.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [],
"children": []
},
{
"id": 6,
"label": "picture",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
{
"id": 19,
"label": "table",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
{
"id": 2,
"label": "table",
"bbox": {
"l": 323.4,
"t": 242.0,
"r": 526.1,
"b": 344.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
{
"id": 18,
"label": "picture",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
{
"id": 10,
"label": "table",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
{
"id": 20,
"label": "picture",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
{
"id": 9,
"label": "table",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
{
"id": 5,
"label": "picture",
"bbox": {
"l": 55.4,
"t": 384.6,
"r": 280.2,
"b": 497.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
{
"id": 22,
"label": "picture",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
{
"id": 8,
"label": "table",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
{
"id": 7,
"label": "picture",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
{
"id": 11,
"label": "table",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {
"4": {
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.0,
"t": 121.5,
"r": 526.0,
"b": 222.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"19": {
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"2": {
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.4,
"t": 242.0,
"r": 526.1,
"b": 344.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"10": {
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"9": {
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"8": {
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
"11": {
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 14,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 84.2,
"t": 644.4,
"r": 252.2,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.2,
"r_y0": 653.3,
"r_x1": 252.2,
"r_y1": 653.3,
"r_x2": 252.2,
"r_y2": 644.4,
"r_x3": 84.2,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 15: Example with triangular table."
},
{
"label": "caption",
"id": 1,
"page_no": 14,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 652.9,
"r": 545.1,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 661.8,
"r_x1": 545.1,
"r_y1": 661.8,
"r_x2": 545.1,
"r_y2": 652.9,
"r_x3": 308.9,
"r_y3": 652.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.9,
"r_x3": 308.9,
"r_y3": 664.9,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."
},
{
"label": "page_footer",
"id": 3,
"page_no": 14,
"cluster": {
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "15"
},
{
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.0,
"t": 121.5,
"r": 526.0,
"b": 222.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 6,
"page_no": 14,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.4,
"t": 242.0,
"r": 526.1,
"b": 344.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 18,
"page_no": 14,
"cluster": {
"id": 18,
"label": "picture",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 20,
"page_no": 14,
"cluster": {
"id": 20,
"label": "picture",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 5,
"page_no": 14,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 55.4,
"t": 384.6,
"r": 280.2,
"b": 497.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 22,
"page_no": 14,
"cluster": {
"id": 22,
"label": "picture",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 7,
"page_no": 14,
"cluster": {
"id": 7,
"label": "picture",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 14,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 84.2,
"t": 644.4,
"r": 252.2,
"b": 653.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.93,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 84.2,
"r_y0": 653.3,
"r_x1": 252.2,
"r_y1": 653.3,
"r_x2": 252.2,
"r_y2": 644.4,
"r_x3": 84.2,
"r_y3": 644.4,
"coord_origin": "TOPLEFT"
},
"text": "Figure 15: Example with triangular table.",
"orig": "Figure 15: Example with triangular table.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 15: Example with triangular table."
},
{
"label": "caption",
"id": 1,
"page_no": 14,
"cluster": {
"id": 1,
"label": "caption",
"bbox": {
"l": 308.9,
"t": 652.9,
"r": 545.1,
"b": 673.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 661.8,
"r_x1": 545.1,
"r_y1": 661.8,
"r_x2": 545.1,
"r_y2": 652.9,
"r_x3": 308.9,
"r_y3": 652.9,
"coord_origin": "TOPLEFT"
},
"text": "Figure 16: Example of how post-processing helps to restore",
"orig": "Figure 16: Example of how post-processing helps to restore",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 308.9,
"r_y0": 673.8,
"r_x1": 497.6,
"r_y1": 673.8,
"r_x2": 497.6,
"r_y2": 664.9,
"r_x3": 308.9,
"r_y3": 664.9,
"coord_origin": "TOPLEFT"
},
"text": "mis-aligned bounding boxes prediction artifact.",
"orig": "mis-aligned bounding boxes prediction artifact.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."
},
{
"label": "table",
"id": 4,
"page_no": 14,
"cluster": {
"id": 4,
"label": "table",
"bbox": {
"l": 323.0,
"t": 121.5,
"r": 526.0,
"b": 222.9,
"coord_origin": "TOPLEFT"
},
"confidence": 0.86,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 6,
"page_no": 14,
"cluster": {
"id": 6,
"label": "picture",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 19,
"page_no": 14,
"cluster": {
"id": 19,
"label": "table",
"bbox": {
"l": 55.1,
"t": 136.3,
"r": 279.4,
"b": 249.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.56,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ecel",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"rhed",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"rhed",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"ecel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "table",
"id": 2,
"page_no": 14,
"cluster": {
"id": 2,
"label": "table",
"bbox": {
"l": 323.4,
"t": 242.0,
"r": 526.1,
"b": 344.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 18,
"page_no": 14,
"cluster": {
"id": 18,
"label": "picture",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.57,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 10,
"page_no": 14,
"cluster": {
"id": 10,
"label": "table",
"bbox": {
"l": 54.3,
"t": 260.3,
"r": 279.3,
"b": 373.5,
"coord_origin": "TOPLEFT"
},
"confidence": 0.77,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 20,
"page_no": 14,
"cluster": {
"id": 20,
"label": "picture",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 9,
"page_no": 14,
"cluster": {
"id": 9,
"label": "table",
"bbox": {
"l": 323.5,
"t": 362.5,
"r": 526.0,
"b": 464.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl",
"rhed",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 5,
"page_no": 14,
"cluster": {
"id": 5,
"label": "picture",
"bbox": {
"l": 55.4,
"t": 384.6,
"r": 280.2,
"b": 497.6,
"coord_origin": "TOPLEFT"
},
"confidence": 0.84,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "picture",
"id": 22,
"page_no": 14,
"cluster": {
"id": 22,
"label": "picture",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.55,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 8,
"page_no": 14,
"cluster": {
"id": 8,
"label": "table",
"bbox": {
"l": 353.7,
"t": 487.4,
"r": 495.4,
"b": 635.8,
"coord_origin": "TOPLEFT"
},
"confidence": 0.78,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"fcel",
"ched",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
},
{
"label": "picture",
"id": 7,
"page_no": 14,
"cluster": {
"id": 7,
"label": "picture",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.81,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
},
{
"label": "table",
"id": 11,
"page_no": 14,
"cluster": {
"id": 11,
"label": "table",
"bbox": {
"l": 50.6,
"t": 506.0,
"r": 319.9,
"b": 631.3,
"coord_origin": "TOPLEFT"
},
"confidence": 0.68,
"cells": [],
"children": []
},
"text": null,
"otsl_seq": [
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"ched",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"fcel",
"nl"
],
"num_rows": 0,
"num_cols": 0,
"table_cells": []
}
],
"headers": [
{
"label": "page_footer",
"id": 3,
"page_no": 14,
"cluster": {
"id": 3,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.9,
"cells": [
{
"index": 3,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "15",
"orig": "15",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "15"
}
]
}
},
{
"page_no": 15,
"size": {
"width": 612.0,
"height": 792.0
},
"parsed_page": {
"dimension": {
"angle": 0.0,
"rect": {
"r_x0": 0.0,
"r_y0": 0.0,
"r_x1": 612.0,
"r_y1": 0.0,
"r_x2": 612.0,
"r_y2": 792.0,
"r_x3": 0.0,
"r_y3": 792.0,
"coord_origin": "BOTTOMLEFT"
},
"boundary_type": "crop_box",
"art_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"bleed_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"crop_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"media_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
},
"trim_bbox": {
"l": 0.0,
"t": 792.0,
"r": 612.0,
"b": 0.0,
"coord_origin": "BOTTOMLEFT"
}
},
"bitmap_resources": [],
"char_cells": [],
"word_cells": [],
"textline_cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 517.2,
"r_x1": 545.1,
"r_y1": 517.2,
"r_x2": 545.1,
"r_y2": 508.3,
"r_x3": 50.1,
"r_y3": 508.3,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 529.2,
"r_x1": 173.2,
"r_y1": 529.2,
"r_x2": 173.2,
"r_y2": 520.3,
"r_x3": 50.1,
"r_y3": 520.3,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"has_chars": false,
"has_words": false,
"has_lines": true,
"image": null,
"lines": []
},
"predictions": {
"layout": {
"clusters": [
{
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 508.3,
"r": 545.1,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 517.2,
"r_x1": 545.1,
"r_y1": 517.2,
"r_x2": 545.1,
"r_y2": 508.3,
"r_x3": 50.1,
"r_y3": 508.3,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 529.2,
"r_x1": 173.2,
"r_y1": 529.2,
"r_x2": 173.2,
"r_y2": 520.3,
"r_x3": 50.1,
"r_y3": 520.3,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
{
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.6,
"r": 528.6,
"b": 498.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [],
"children": []
}
]
},
"tablestructure": {
"table_map": {}
},
"figures_classification": null,
"equations_prediction": null,
"vlm_response": null
},
"assembled": {
"elements": [
{
"label": "caption",
"id": 0,
"page_no": 15,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 508.3,
"r": 545.1,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 517.2,
"r_x1": 545.1,
"r_y1": 517.2,
"r_x2": 545.1,
"r_y2": 508.3,
"r_x3": 50.1,
"r_y3": 508.3,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 529.2,
"r_x1": 173.2,
"r_y1": 529.2,
"r_x2": 173.2,
"r_y2": 520.3,
"r_x3": 50.1,
"r_y3": 520.3,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."
},
{
"label": "page_footer",
"id": 1,
"page_no": 15,
"cluster": {
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "16"
},
{
"label": "picture",
"id": 2,
"page_no": 15,
"cluster": {
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.6,
"r": 528.6,
"b": 498.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"body": [
{
"label": "caption",
"id": 0,
"page_no": 15,
"cluster": {
"id": 0,
"label": "caption",
"bbox": {
"l": 50.1,
"t": 508.3,
"r": 545.1,
"b": 529.2,
"coord_origin": "TOPLEFT"
},
"confidence": 0.96,
"cells": [
{
"index": 0,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 517.2,
"r_x1": 545.1,
"r_y1": 517.2,
"r_x2": 545.1,
"r_y2": 508.3,
"r_x3": 50.1,
"r_y3": 508.3,
"coord_origin": "TOPLEFT"
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"orig": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
},
{
"index": 1,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 50.1,
"r_y0": 529.2,
"r_x1": 173.2,
"r_y1": 529.2,
"r_x2": 173.2,
"r_y2": 520.3,
"r_x3": 50.1,
"r_y3": 520.3,
"coord_origin": "TOPLEFT"
},
"text": "ing and prediction of structure.",
"orig": "ing and prediction of structure.",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."
},
{
"label": "picture",
"id": 2,
"page_no": 15,
"cluster": {
"id": 2,
"label": "picture",
"bbox": {
"l": 66.8,
"t": 253.6,
"r": 528.6,
"b": 498.1,
"coord_origin": "TOPLEFT"
},
"confidence": 0.69,
"cells": [],
"children": []
},
"text": "",
"annotations": [],
"provenance": null,
"predicted_class": null,
"confidence": null
}
],
"headers": [
{
"label": "page_footer",
"id": 1,
"page_no": 15,
"cluster": {
"id": 1,
"label": "page_footer",
"bbox": {
"l": 292.6,
"t": 734.1,
"r": 302.6,
"b": 743.0,
"coord_origin": "TOPLEFT"
},
"confidence": 0.91,
"cells": [
{
"index": 2,
"rgba": {
"r": 0,
"g": 0,
"b": 0,
"a": 255
},
"rect": {
"r_x0": 292.6,
"r_y0": 743.0,
"r_x1": 302.6,
"r_y1": 743.0,
"r_x2": 302.6,
"r_y2": 734.1,
"r_x3": 292.6,
"r_y3": 734.1,
"coord_origin": "TOPLEFT"
},
"text": "16",
"orig": "16",
"text_direction": "left_to_right",
"confidence": 1.0,
"from_ocr": false
}
],
"children": []
},
"text": "16"
}
]
}
}
] |